Mock Version: 6.3 Mock Version: 6.3 Mock Version: 6.3 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/llama-cpp.spec'], chrootPath='/var/lib/mock/f43-build-60929968-6586012/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c5pqu399:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c5pqu399:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', 'be5c48c6fc784920971c71dd710ff5f1', '-D', '/var/lib/mock/f43-build-60929968-6586012/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c5pqu399:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', 
'--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/llama-cpp.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1746057600 Wrote: /builddir/build/SRPMS/llama-cpp-b4580-3.fc43.src.rpm Child return code was: 0 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/llama-cpp.spec'], chrootPath='/var/lib/mock/f43-build-60929968-6586012/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c5pqu399:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using 
nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c5pqu399:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', 'c78ab1ab43b54856b125546991c3ad4b', '-D', '/var/lib/mock/f43-build-60929968-6586012/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.c5pqu399:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/llama-cpp.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1746057600 Executing(%mkbuilddir): /bin/sh -e /var/tmp/rpm-tmp.sSgOGa Executing(%prep): /bin/sh -e /var/tmp/rpm-tmp.06RkWu + 
umask 022 + cd /builddir/build/BUILD/llama-cpp-b4580-build + cd /builddir/build/BUILD/llama-cpp-b4580-build + rm -rf llama.cpp-b4580 + /usr/lib/rpm/rpmuncompress -x /builddir/build/SOURCES/llama.cpp-b4580.tar.gz + STATUS=0 + '[' 0 -ne 0 ']' + cd llama.cpp-b4580 + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w . + sed -i -e 's/POSITION_INDEPENDENT_CODE ON/POSITION_INDEPENDENT_CODE ON SOVERSION b4580/' src/CMakeLists.txt + sed -i -e 's/POSITION_INDEPENDENT_CODE ON/POSITION_INDEPENDENT_CODE ON SOVERSION b4580/' ggml/src/CMakeLists.txt + sed -i '/target_link_libraries(ggml-hip PRIVATE ggml-base.*/aset_target_properties(ggml-hip PROPERTIES SOVERSION b4580)' ggml/src/ggml-hip/CMakeLists.txt + sed -i '/target_compile_features(${GGML_CPU_NAME} PRIVATE c_std_11.*/aset_target_properties(${GGML_CPU_NAME} PROPERTIES SOVERSION b4580)' ggml/src/ggml-cpu/CMakeLists.txt + sed -i '/#include ' src/llama-mmap.h + rm -rf exmples/llma.android + find . -name .gitignore -exec rm -rf '{}' ';' + RPM_EC=0 ++ jobs -p + exit 0 Executing(%build): /bin/sh -e /var/tmp/rpm-tmp.9umxSn + umask 022 + cd /builddir/build/BUILD/llama-cpp-b4580-build + CFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + 
FFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd llama.cpp-b4580 + CFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config 
/usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + /usr/bin/cmake -S . 
-B redhat-linux-build -DCMAKE_C_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_CXX_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_Fortran_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_VERBOSE_MAKEFILE:BOOL=ON -DCMAKE_INSTALL_DO_STRIP:BOOL=OFF -DCMAKE_INSTALL_PREFIX:PATH=/usr -DCMAKE_INSTALL_FULL_SBINDIR:PATH=/usr/bin -DCMAKE_INSTALL_SBINDIR:PATH=bin -DINCLUDE_INSTALL_DIR:PATH=/usr/include -DLIB_INSTALL_DIR:PATH=/usr/lib64 -DSYSCONF_INSTALL_DIR:PATH=/etc -DSHARE_INSTALL_PREFIX:PATH=/usr/share -DLIB_SUFFIX=64 -DBUILD_SHARED_LIBS:BOOL=ON -DCMAKE_INSTALL_LIBDIR=lib64 -DCMAKE_SKIP_RPATH=ON -DGGML_AVX=OFF -DGGML_AVX2=OFF -DGGML_AVX512=OFF -DGGML_AVX512_VBMI=OFF -DGGML_AVX512_VNNI=OFF -DGGML_FMA=OFF -DGGML_F16C=OFF -DGGML_HIP=ON '-DAMDGPU_TARGETS=gfx900;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack+;gfx90a:xnack-;gfx942;gfx1010;gfx1012;gfx1030;gfx1031;gfx1035;gfx1100;gfx1101;gfx1102;gfx1103;gfx1150;gfx1151;gfx1152;gfx1200;gfx1201' -DLLAMA_BUILD_EXAMPLES=OFF -DLLAMA_BUILD_TESTS=OFF -- The C compiler identification is Clang 19.0.0 -- The CXX compiler identification is Clang 19.0.0 -- Detecting C compiler ABI info -- Detecting C compiler ABI info - done -- Check for working C compiler: /usr/bin/hipcc - skipped -- Detecting C compile features -- Detecting C compile features - done -- Detecting CXX compiler ABI info -- Detecting CXX compiler ABI info - done -- Check for working CXX compiler: /usr/bin/hipcc - skipped -- Detecting CXX compile features -- Detecting CXX compile features - done -- Found Git: /usr/bin/git (found version "2.50.0") fatal: not a git repository (or any of the parent directories): .git fatal: not a git repository (or any of the parent directories): .git sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory -- Setting GGML_NATIVE_DEFAULT to OFF -- Performing Test CMAKE_HAVE_LIBC_PTHREAD -- Performing Test CMAKE_HAVE_LIBC_PTHREAD - Success -- Found Threads: TRUE -- Warning: ccache not found - consider 
installing it for faster compilation or disable this warning with GGML_CCACHE=OFF -- CMAKE_SYSTEM_PROCESSOR: x86_64 -- Including CPU backend -- Could NOT find OpenMP_C (missing: OpenMP_C_FLAGS OpenMP_C_LIB_NAMES) -- Could NOT find OpenMP_CXX (missing: OpenMP_CXX_FLAGS OpenMP_CXX_LIB_NAMES) -- Could NOT find OpenMP (missing: OpenMP_C_FOUND OpenMP_CXX_FOUND) CMake Warning at ggml/src/ggml-cpu/CMakeLists.txt:54 (message): OpenMP not found Call Stack (most recent call first): ggml/src/CMakeLists.txt:312 (ggml_add_cpu_backend_variant_impl) -- x86 detected -- Adding CPU backend variant ggml-cpu: -msse4.2 GGML_SSE42 CMake Warning at ggml/src/ggml-hip/CMakeLists.txt:27 (message): Setting hipcc as the C++ compiler is legacy behavior. Prefer setting the HIP compiler directly. See README for details. CMake Warning (dev) at /usr/lib64/cmake/hip/hip-config-amd.cmake:70 (message): AMDGPU_TARGETS is deprecated. Please use GPU_TARGETS instead. Call Stack (most recent call first): /usr/lib64/cmake/hip/hip-config.cmake:159 (include) ggml/src/ggml-hip/CMakeLists.txt:39 (find_package) This warning is for project developers. Use -Wno-dev to suppress it. -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS - Success -- HIP and hipBLAS found -- Including HIP backend fatal: not a git repository (or any of the parent directories): .git fatal: not a git repository (or any of the parent directories): .git CMake Warning at common/CMakeLists.txt:32 (message): Git repository not found; to enable automatic generation of build info, make sure Git is installed and the project is a Git repository. 
-- Configuring done (9.4s) -- Generating done (0.0s) CMake Warning: Manually-specified variables were not used by the project: CMAKE_Fortran_FLAGS_RELEASE CMAKE_INSTALL_DO_STRIP INCLUDE_INSTALL_DIR LIB_INSTALL_DIR LIB_SUFFIX SHARE_INSTALL_PREFIX SYSCONF_INSTALL_DIR -- Build files have been written to: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build + /usr/bin/cmake --build redhat-linux-build -j8 --verbose Change Dir: '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' Run Build Command(s): /usr/bin/cmake -E env VERBOSE=1 /usr/bin/gmake -f Makefile -j8 /usr/bin/cmake -S/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 -B/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build --check-build-system CMakeFiles/Makefile.cmake 0 /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/CMakeFiles /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build//CMakeFiles/progress.marks /usr/bin/gmake -f CMakeFiles/Makefile2 all gmake[1]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f ggml/src/CMakeFiles/ggml-base.dir/build.make ggml/src/CMakeFiles/ggml-base.dir/depend /usr/bin/gmake -f common/CMakeFiles/build_info.dir/build.make common/CMakeFiles/build_info.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/CMakeFiles/ggml-base.dir/DependInfo.cmake "--color=" gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f ggml/src/CMakeFiles/ggml-base.dir/build.make ggml/src/CMakeFiles/ggml-base.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 0%] Generating build details from Git cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 && /usr/bin/cmake -DMSVC= -DCMAKE_C_COMPILER_VERSION=19.0.0 -DCMAKE_C_COMPILER_ID=Clang -DCMAKE_VS_PLATFORM_NAME= -DCMAKE_C_COMPILER=/usr/bin/hipcc -P /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/cmake/build-info-gen-cpp.cmake [ 1%] Building C object ggml/src/CMakeFiles/ggml-base.dir/ggml.c.o [ 2%] Building C object ggml/src/CMakeFiles/ggml-base.dir/ggml-alloc.c.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_base_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu11 -fPIC -Wshadow -Wstrict-prototypes -Wpointer-arith -Wmissing-prototypes -Werror=implicit-int -Werror=implicit-function-declaration -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wdouble-promotion -MD -MT ggml/src/CMakeFiles/ggml-base.dir/ggml.c.o -MF CMakeFiles/ggml-base.dir/ggml.c.o.d -o CMakeFiles/ggml-base.dir/ggml.c.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml.c [ 3%] Building CXX object ggml/src/CMakeFiles/ggml-base.dir/ggml-threading.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_base_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu11 -fPIC -Wshadow -Wstrict-prototypes -Wpointer-arith -Wmissing-prototypes -Werror=implicit-int -Werror=implicit-function-declaration -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wdouble-promotion -MD -MT ggml/src/CMakeFiles/ggml-base.dir/ggml-alloc.c.o -MF CMakeFiles/ggml-base.dir/ggml-alloc.c.o.d -o CMakeFiles/ggml-base.dir/ggml-alloc.c.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-alloc.c [ 4%] Building CXX object ggml/src/CMakeFiles/ggml-base.dir/gguf.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_base_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT ggml/src/CMakeFiles/ggml-base.dir/ggml-threading.cpp.o -MF CMakeFiles/ggml-base.dir/ggml-threading.cpp.o.d -o CMakeFiles/ggml-base.dir/ggml-threading.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-threading.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_base_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT ggml/src/CMakeFiles/ggml-base.dir/gguf.cpp.o -MF CMakeFiles/ggml-base.dir/gguf.cpp.o.d -o CMakeFiles/ggml-base.dir/gguf.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/gguf.cpp [ 5%] Building C object ggml/src/CMakeFiles/ggml-base.dir/ggml-quants.c.o [ 6%] Building CXX object ggml/src/CMakeFiles/ggml-base.dir/ggml-opt.cpp.o [ 6%] Building CXX object ggml/src/CMakeFiles/ggml-base.dir/ggml-backend.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_base_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu11 -fPIC -Wshadow -Wstrict-prototypes -Wpointer-arith -Wmissing-prototypes -Werror=implicit-int -Werror=implicit-function-declaration -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wdouble-promotion -MD -MT ggml/src/CMakeFiles/ggml-base.dir/ggml-quants.c.o -MF CMakeFiles/ggml-base.dir/ggml-quants.c.o.d -o CMakeFiles/ggml-base.dir/ggml-quants.c.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-quants.c cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_base_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT ggml/src/CMakeFiles/ggml-base.dir/ggml-backend.cpp.o -MF CMakeFiles/ggml-base.dir/ggml-backend.cpp.o.d -o CMakeFiles/ggml-base.dir/ggml-backend.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-backend.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_base_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT ggml/src/CMakeFiles/ggml-base.dir/ggml-opt.cpp.o -MF CMakeFiles/ggml-base.dir/ggml-opt.cpp.o.d -o CMakeFiles/ggml-base.dir/ggml-opt.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-opt.cpp -- Found Git: /usr/bin/git (found version "2.50.0") fatal: not a git repository (or any of the parent directories): .git fatal: not a git repository (or any of the parent directories): .git sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common/CMakeFiles/build_info.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f common/CMakeFiles/build_info.dir/build.make common/CMakeFiles/build_info.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 7%] Building CXX object common/CMakeFiles/build_info.dir/build-info.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/build_info.dir/build-info.cpp.o -MF CMakeFiles/build_info.dir/build-info.cpp.o.d -o CMakeFiles/build_info.dir/build-info.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/build-info.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 7%] Built target build_info [ 8%] Linking CXX shared library ../../bin/libggml-base.so 
cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/cmake -E cmake_link_script CMakeFiles/ggml-base.dir/link.txt --verbose=1 sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory clang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] /usr/bin/hipcc -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -Xlinker --dependency-file=CMakeFiles/ggml-base.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,libggml-base.so.b4580 -o ../../bin/libggml-base.so.b4580 "CMakeFiles/ggml-base.dir/ggml.c.o" "CMakeFiles/ggml-base.dir/ggml-alloc.c.o" "CMakeFiles/ggml-base.dir/ggml-backend.cpp.o" "CMakeFiles/ggml-base.dir/ggml-opt.cpp.o" "CMakeFiles/ggml-base.dir/ggml-threading.cpp.o" "CMakeFiles/ggml-base.dir/ggml-quants.c.o" "CMakeFiles/ggml-base.dir/gguf.cpp.o" -lm cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/cmake -E cmake_symlink_library ../../bin/libggml-base.so.b4580 ../../bin/libggml-base.so.b4580 ../../bin/libggml-base.so gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 8%] 
Built target ggml-base /usr/bin/gmake -f ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/build.make ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/depend /usr/bin/gmake -f ggml/src/CMakeFiles/ggml-cpu.dir/build.make ggml/src/CMakeFiles/ggml-cpu.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/CMakeFiles/ggml-cpu.dir/DependInfo.cmake "--color=" gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f ggml/src/CMakeFiles/ggml-cpu.dir/build.make ggml/src/CMakeFiles/ggml-cpu.dir/build gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' gmake[2]: Entering directory 
'/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/build.make ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 9%] Building C object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.c.o [ 10%] Building CXX object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.cpp.o [ 10%] Building CXX object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-aarch64.cpp.o [ 11%] Building CXX object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-hbm.cpp.o [ 12%] Building C object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-quants.c.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.cpp.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.cpp.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/ggml-cpu.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu11 -fPIC -Wshadow -Wstrict-prototypes -Wpointer-arith -Wmissing-prototypes -Werror=implicit-int -Werror=implicit-function-declaration -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wdouble-promotion -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.c.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.c.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.c.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/ggml-cpu.c cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-aarch64.cpp.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-aarch64.cpp.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-aarch64.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/ggml-cpu-aarch64.cpp [ 12%] Building CXX object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/amx.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-hbm.cpp.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-hbm.cpp.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-hbm.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/ggml-cpu-hbm.cpp [ 13%] Building CXX object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-traits.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu11 -fPIC -Wshadow -Wstrict-prototypes -Wpointer-arith -Wmissing-prototypes -Werror=implicit-int -Werror=implicit-function-declaration -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wdouble-promotion -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-quants.c.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-quants.c.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-quants.c.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/ggml-cpu-quants.c cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/amx.cpp.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/amx.cpp.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/amx.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/amx/amx.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-traits.cpp.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-traits.cpp.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-traits.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/ggml-cpu-traits.cpp [ 14%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/acc.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/acc.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/acc.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/acc.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 15%] Building CXX object 
ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/mmq.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/mmq.cpp.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/mmq.cpp.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/mmq.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/amx/mmq.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 16%] Building CXX object ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/llamafile/sgemm.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_SSE42 -DGGML_USE_CPU_AARCH64 -DGGML_USE_LLAMAFILE -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_cpu_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -msse4.2 -MD -MT ggml/src/CMakeFiles/ggml-cpu.dir/ggml-cpu/llamafile/sgemm.cpp.o -MF CMakeFiles/ggml-cpu.dir/ggml-cpu/llamafile/sgemm.cpp.o.d -o CMakeFiles/ggml-cpu.dir/ggml-cpu/llamafile/sgemm.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cpu/llamafile/sgemm.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory 6 warnings generated when compiling for gfx1010. [ 17%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/arange.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/arange.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/arange.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/arange.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 17%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/argmax.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/argmax.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/argmax.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/argmax.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu [ 18%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/argsort.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/argsort.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/argsort.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/argsort.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu [ 19%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/binbcast.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/binbcast.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/binbcast.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/binbcast.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu 6 warnings generated when compiling for gfx1012. 
[ 20%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/clamp.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/clamp.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/clamp.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/clamp.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu [ 21%] Building CXX 
object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/concat.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/concat.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/concat.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/concat.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 22%] Linking CXX shared library ../../bin/libggml-cpu.so cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/cmake -E cmake_link_script CMakeFiles/ggml-cpu.dir/link.txt --verbose=1 sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory 6 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ clang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1010. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1010. 9 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1012. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 9 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1035. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1100. 6 warnings generated when compiling for gfx1031. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 7 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /usr/bin/hipcc -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -Xlinker --dependency-file=CMakeFiles/ggml-cpu.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,libggml-cpu.so.b4580 -o 
../../bin/libggml-cpu.so.b4580 "CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.c.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu.cpp.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-aarch64.cpp.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-hbm.cpp.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-quants.c.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/ggml-cpu-traits.cpp.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/amx.cpp.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/amx/mmq.cpp.o" "CMakeFiles/ggml-cpu.dir/ggml-cpu/llamafile/sgemm.cpp.o" ../../bin/libggml-base.so.b4580 cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/cmake -E cmake_symlink_library ../../bin/libggml-cpu.so.b4580 ../../bin/libggml-cpu.so.b4580 ../../bin/libggml-cpu.so gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 22%] Built target ggml-cpu [ 22%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/conv-transpose-1d.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/conv-transpose-1d.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/conv-transpose-1d.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/conv-transpose-1d.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu 6 warnings generated when compiling for gfx1101. 6 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1035. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | 
^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1100. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1010. 6 warnings generated when compiling for gfx1100. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 6 warnings generated when compiling for 
gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused 
parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 
'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); 6 warnings generated when compiling for gfx1103. | ^~~~~~~~~~ 6 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 17 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 9 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 17 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. 6 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 7 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 17 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 9 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | st6 warnings generated when compiling for gfx1150. 
ruct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. 6 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused 
parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 
'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 17 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: 
warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings 
generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 17 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct 
{ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 6 warnings generated when compiling for gfx1152. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | 
^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 17 warnings generated when compiling for gfx1101. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | 
struct { | ^ 6 warnings generated when compiling for gfx1152. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ 6 warnings generated when compiling for gfx1200. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1200. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 17 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1200. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 6 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: 
comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx1201. 7 warnings generated when compiling for gfx1150. 17 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. 
6 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu : 41 : 20 : swarning: tcomparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare]r uct { | 41 ^ | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: 
warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx1201. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_6n warnings generated when compiling for gfx906. e1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 17 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 6 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: 
comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p06 warnings generated when compiling for gfx908. , const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' 
[-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~6 warnings generated when compiling for gfx908. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 17 warnings generated when compiling for gfx1152. 9 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, 
const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 17 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx908. 6 warnings generated when compiling for gfx942. 7 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | 
^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/acc.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const 
int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx90a. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 17 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. 9 warnings generated when compiling for gfx90a. 
[ 23%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/convert.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/convert.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/convert.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/convert.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx942. 7 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx942. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, 
const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for gfx942. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 17 warnings generated when compiling for gfx900. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ 9 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template 
specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/arange.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx942. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 6 warnings generated when compiling for host. 
[ 24%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/count-equal.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/count-equal.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/count-equal.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/count-equal.cu.o -c 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/clamp.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 13 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cu:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argmax.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. [ 25%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/cpy.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/cpy.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/cpy.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/cpy.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu 7 warnings generated when compiling for gfx900. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 6 warnings generated when compiling for host. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ [ 26%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/cross-entropy-loss.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/cross-entropy-loss.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/cross-entropy-loss.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/cross-entropy-loss.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu 17 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/argsort.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ [ 27%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/diagmask.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/diagmask.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/diagmask.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/diagmask.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ 7 warnings generated when 
compiling for gfx1010. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template 
specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | 
^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 13 warnings generated when compiling for gfx1012. 17 warnings generated when compiling for gfx908. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:41:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 41 | if (blockIdx.y < ne01) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:67:20: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 67 | if (blockIdx.z < ne02) { // src0 | ~~~~~~~~~~ ^ ~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/concat.cu:218:17: warning: 'break' will never be executed [-Wunreachable-code-break] 218 | break; | ^~~~~ 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 9 warnings generated when compiling for host. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 27%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f16.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu 6 warnings generated when compiling for gfx1010. 7 warnings generated when compiling for gfx906. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1010. 7 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const 
qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier 
[-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ 17 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hIn file included from :298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' 
[-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier 
[-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 13 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation 
of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1012. 7 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx908. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const 
int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 17 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu::11: : In file included from In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh::201: : In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: :/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h171::1719::9 :warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 171 | s t rsutcrtu c{t {| ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h : 192s:t9r:u cwarning: tanonymous types declared in an anonymous union are an extension [-Wnested-anon-types] { | ^192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]: 213:9 :213 | warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | s tr u c t { st | r ^u ct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h9:: 254warning: :anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]9 : warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]254 | 254 | s t ru cstt r{ u ct| ^ { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h :281281 | : 9 : warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] s t281 | r uc t { | ^ s truct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h : 298:s9tr: ucwarning: tanonymous types declared in an anonymous union are an extension [-Wnested-anon-types] { 298 | | ^ struct { | ^ 6 warnings generated when compiling for gfx1030. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 
| struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 13 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ 17 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 7 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: 
warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu ^: 33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:33: warning: unused parameter 'p0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:4:47: warning: unused parameter 'd0' [-Wunused-parameter] 4 | const int s0, const int p0, const int d0, const int output_size, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:5:79: warning: unused parameter 'src0_ne3' [-Wunused-parameter] 5 | const int src0_ne0, const int src0_ne1, const int src0_ne2, const int src0_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:39: warning: unused parameter 'src1_ne1' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:59: warning: unused parameter 'src1_ne2' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:6:79: warning: unused parameter 'src1_ne3' [-Wunused-parameter] 6 | const int src1_ne0, const int src1_ne1, const int src1_ne2, const int src1_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:38: warning: unused parameter 'dst_ne1' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:57: warning: unused parameter 'dst_ne2' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:7:76: warning: unused parameter 'dst_ne3' [-Wunused-parameter] 7 | const int dst_ne0, const int dst_ne1, const int dst_ne2, const int dst_ne3, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:78:19: warning: unused variable 'kernel_size' [-Wunused-variable] 78 | const int64_t kernel_size = ggml_nelements(src0); | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/conv-transpose-1d.cu:79:19: warning: unused variable 'input_size' [-Wunused-variable] 79 | const int64_t input_size = ggml_nelements(src1); | ^~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 17 warnings generated when compiling for host. [ 28%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f32.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f32.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f32.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f32.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu 30 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h ^ :281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | st/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hru:c298t: {9 : | warning: ^anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 13 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1035. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1035. 7 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: 
function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 
'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: 
warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: 
warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template 
specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 13 warnings generated when compiling for gfx1100. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ 6 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1101. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1101. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ 7 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of 
function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; 
| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 13 warnings generated when 
compiling for gfx1101. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/binbcast.cu:359:11: warning: 'break' will never be executed [-Wunreachable-code-break] 359 | } break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1100. 6 warnings generated when compiling for gfx1102. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1103. 7 warnings generated when compiling for host. 
[ 29%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const 
void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ 30 warnings generated when compiling for gfx1012. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier 
[-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx1103. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 13 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1150. 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ for (int /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hl:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: 
unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: 
warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ _meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: 
unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | 
break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 
'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ :5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void 
on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 
'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1In file included from : In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh::120: : In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh::1711:: 9In file included from :/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh :warning: 20anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: 171warning: | anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | s t r u c t { s t| r ^u ct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | s/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.htr:u192c:t9 :{ warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]| ^ 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | stru/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hc:t213 :9{: warning: | anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] ^ 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hanonymous types declared in an anonymous union are an extension [-Wnested-anon-types] :254: 9254: | warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | st r u c t { s t| ru ^c t { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:9::281 :warning: 9anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | 281 | s t srturcutc t{ { | | ^ ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h::298298::99:: warning: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298298 | | s tsrutrcut ct{ {| ^ | ^ 80 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops 
const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ 6 warnings generated when compiling for gfx1150. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ 6/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu warning:s580 generated: when compiling for 33gfx1150:. warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ 7 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 13 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int 
ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu213: | 6 : /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh : 21 : 19 :st rwarning: uunused parameter 'ne00' [-Wunused-parameter]c t { 21 | | ^ const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' 
[-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h: :warning: 254unused parameter 'ne3' [-Wunused-parameter]: 9: 43warning: | anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | c on s t i nst tnreu3c)t {{ | | ^ ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: 
warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 
43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. 80 warnings generated when compiling for gfx1012. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: 
cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 
| struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 13 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 
38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed 
[-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ 30 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested 
here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1152. 7 warnings generated when compiling for gfx1200. 80 warnings generated when compiling for gfx1030. 30 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 
| struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 
'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 
27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' 
[-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 6 warnings generated when compiling for gfx1200. 7 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' 
[-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | 13 c warnings generated when compiling for gfx1151. 
onst int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused 
parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19:In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const 
int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned 
int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int 
ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | 
const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested hereIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | 
launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 298 | struct { | ^ 80 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 7 warnings generated when compiling for gfx900. 6 warnings generated when compiling for gfx1201. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 
'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int 
ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' 
[-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 
42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed 
[-Wunreachable-code-break] 42 | break; | ^~~~~ 13 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. 80 warnings generated when compiling for gfx1035. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 7 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + 
blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 30 warnings generated when compiling for gfx1030. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, 
k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int 
ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | 
const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 
| const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 
41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed 
[-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: 13 warnings generated when compiling for gfx1200. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 
32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ 7 warnings generated when compiling for gfx908. 30 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 80 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + 
blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in 
instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 7 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const 
int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested 
here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: 
warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 
39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed 
[-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ 13 warnings generated when compiling for gfx1201. 
80 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 7 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | 
struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: 
in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return 
convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ 6 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' 
[-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 
37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' 
[-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ 13 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 80 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t 
*) vx; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation 
of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ 30 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: 
unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int 
ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | 
const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused 
parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/count-equal.cu:62:13: warning: 'break' will never be executed [-Wunreachable-code-break] 62 | break; | ^~~~~ 32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 
43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ [ 30%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/getrows.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/getrows.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/getrows.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/getrows.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu 13 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/diagmask.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 80 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) 
{ | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 6 warnings generated when compiling for host. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested 
here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ [ 31%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/ggml-cuda.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 
--offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/ggml-cuda.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/ggml-cuda.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/ggml-cuda.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' 
[-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' 
[-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cross-entropy-loss.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ 6 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested 
here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ 7 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int 
ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 
'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 
44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ 6 warnings generated when compiling for host. 
[ 31%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/gla.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/gla.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/gla.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/gla.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested 
here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ 13 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 80 warnings generated when compiling for gfx1150. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 29 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1012. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of 
function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int 
ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' 
[-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 
42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed 
[-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation 
of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 
'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ 13 warnings generated when compiling for gfx90a. 6/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ warnings generated when compiling for gfx1010. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 80 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for gfx1012. 30 warnings generated when compiling for gfx1035. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 7 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 30 warnings generated when compiling for gfx1100. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' 
[-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 
37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' 
[-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13:In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24:In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_res/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuhu:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k0l0) { | ^ ts | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of 
function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const 
int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 13 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 80 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested 
here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for gfx1030. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 6 warnings generated when compiling for gfx1012. 7 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' 
to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of 
integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 
'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 
281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K,In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ :19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh :1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const 
int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int n/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ b21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuhb:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ reak; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | 
ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 29 warnings generated when compiling for gfx1031. 13 warnings generated when compiling for gfx942. 80 warnings generated when compiling for gfx1200. 7 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ 6 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 
2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + b/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuhl:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ ockIdx.x * nint; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int 
ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *__restrict' to 'type-parameter-0-0 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | 
const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 
| float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 
40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed 
[-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:467:9: note: in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 467 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:33:31: warning: cast from 'const void *' to 'int *' drops const qualifier [-Wcast-qual] 33 | const int * x0 = ((int *) vx) + blockIdx.x * nint; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:470:9: note: 
in instantiation of function template specialization 'dequantize_block_q8_0_f16' requested here 470 | dequantize_block_q8_0_f16<<>>(vx, y, k); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'float *' drops const qualifier [-Wcast-qual] 580 
| const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:635:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 635 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to '__half *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary<__half, float>' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:682:20: note: in instantiation of function template specialization 'convert_unary_cuda<__half, float>' requested here 682 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:580:33: warning: cast from 'const void *' to 'hip_bfloat16 *' drops const qualifier [-Wcast-qual] 580 | const src_t * x = (src_t *) vx; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:588:5: note: in instantiation of function template specialization 'convert_unary' requested here 588 | convert_unary<<>>(vx, y, k); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/convert.cu:684:20: note: in instantiation of function template specialization 'convert_unary_cuda' requested here 684 | return convert_unary_cuda; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: 
unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 7 warnings generated when compiling for gfx1100. 13 warnings generated when compiling for host. [ 32%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/im2col.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/im2col.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/im2col.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/im2col.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for gfx1035. 80 warnings generated when compiling for gfx1201. 30 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/cpy.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | s30 warnings generated when compiling for gfx1101. truct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. [ 33%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmq.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmq.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmq.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmq.cu.o -c 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const 
int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 
38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed 
[-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ 6 warnings generated when compiling for gfx1031. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ 6 warnings generated when compiling for gfx1010. 7 warnings generated when compiling for gfx1101. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } 
break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 29 warnings generated when compiling for gfx1100. 80 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested 
here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 
348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 15 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 6 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 7 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t 
*) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' 
[-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: 
unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested 
here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' 
[-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 
3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for gfx1101. 80 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct 
{ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | 
const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1012. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 6 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ 
void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * 
__restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 
40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed 
[-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 29s warnings generated when compiling for gfx1102. truct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 80 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1101. 6 warnings generated when compiling for gfx1100. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 6 warnings generated when compiling for gfx1031. 
7 warnings generated when compiling for gfx1150. 30 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' 
[-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: 
unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could 
be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1031. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } 
break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 29 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 80 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested 
here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1035. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void 
on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 
'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 7 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= 
ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | 
^ 6 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 15 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: 
function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' 
[-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * 
__restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 
40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed 
[-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in 
instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 
704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1100. 29 warnings generated when compiling for gfx1150. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 80 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & 
ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 15 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, c/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuhon:st563: 47i:nt warning: &function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] ne0 1563, | csotnatsti ci nvtoi d& osnt_rnidoe_f01at, tnco_nvestc_ icnatse( &c onnes1t0 ,in tc oDns)t { i n t| ^ & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 
37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' 
[-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 
'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: 
warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be 
executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for gfx1151. 80 warnings generated when compiling for gfx942. 7 warnings generated when compiling for gfx1200. 30 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ 
__forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:6: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int 
ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:7: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' 
[-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu : 201 :c13o:n swarning: t'break' will never be executed [-Wunreachable-code-break] i nt ne10, | 201 ^ | 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh : 31 :19 : warning: unused parameter 'ne11' [-Wunused-parameter] br e31a | k ; | ^~~~~ const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' 
[-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:145:13: warning: 'break' will never be executed [-Wunreachable-code-break] 145 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:118:17: warning: 'break' will never be executed [-Wunreachable-code-break] 118 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:90:17: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:67:21: warning: 'break' will 
never be executed [-Wunreachable-code-break] 67 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:42:21: warning: 'break' will never be executed [-Wunreachable-code-break] 42 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, 
cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn.cu:141:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_wmma_f16_case<256, 32, __half>' requested here 141 | ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, half>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 80 warnings generated when compiling for host. 7 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ [ 34%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmv.cu.o In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: 
note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 
--offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmv.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmv.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmv.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, 
const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused 
parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 6 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h,: 281:c9o:n warning: stanonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] in t281 | & st ri d e 1 1 ,st rcuocnts t{ i n| t ^ & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 29 warnings generated when compiling for gfx1152. 15 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: 
warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 7 warnings generated when compiling for gfx900. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ 
sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 15 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for gfx1200. 6 warnings generated when compiling for gfx1010. 
6 warnings generated when compiling for gfx1150. 6 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h105:: 192warning: :function 
'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn]9 : warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | 172 | _ _sdtervuiccte _{_ _| _ ^f orceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const 
int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 7 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never 
be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 29 warnings generated when compiling for gfx1201. 30 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1151. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: 
warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 30 warnings generated when compiling for gfx1150. 15 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 7 warnings generated when compiling for gfx908. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' 
[-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused 
parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | 
launch_fattn_tile_f32_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 
'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 15 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested 
here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 7 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 6 warnings generated when compiling for gfx1200. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 29 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1200. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ 15 warnings generated when compiling for gfx1201. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } 
break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 30 warnings generated when compiling for gfx1150. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ 29 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 6 warnings generated when compiling for gfx900. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, 
const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 
'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 6 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | 
launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/getrows.cu:201:13: warning: 'break' will never be executed [-Wunreachable-code-break] 201 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed 
[-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for host. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 35%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmvq.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmvq.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmvq.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmvq.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu 29 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared 
in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 6 warnings generated when compiling for gfx906. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: 
warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 
'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & 
stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 15 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' 
requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | 
mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | 
mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | 
^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { 
| ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_b6 warnings generated when compiling for gfx1100. lock] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { }/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, 
stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nro6w warnings generated when compiling for gfx900. s_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, 
nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] 
= {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncolsIn file included from _/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ y, nrows_dst, s/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ tream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | stru/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ ct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: 
warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ : warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ :281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in 
instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_6 warnings generated when compiling for gfx908. 
x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, 
nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nr29 warnings generated when compiling for gfx90a. ows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < 
rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, 
nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ x.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ warning: unused parameter 'k00' [-Wunused-parameter] 1053 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ const int * __/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ restrict__ x, const int * /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:_98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ _restrict__ y,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ float * __restrict__ sum/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu, const int & k00) { | ^ :126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ (vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | 
^~~~/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ :2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ :126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_bl/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ ock == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | 
mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | 
mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < 
rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < 
nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | 15 ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ warnings generated when compiling for gfx908. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' 
[-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | 
^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 30 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 6 warnings generated when compiling for gfx1101. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 29 warnings generated when compiling for gfx942. 15 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:5: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' 
to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:22: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 132 | char archName[archLen + 1]; | ^~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:132:19: note: read of non-const variable 
'archLen' is not allowed in a constant expression /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:131:9: note: declared here 131 | int archLen = strlen(devName); | ^ 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:52: warning: unused parameter 'buffer' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2837:67: warning: unused parameter 'size' [-Wunused-parameter] 2837 | bool ggml_backend_cuda_register_host_buffer(void * buffer, size_t size) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3142:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3142 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3137:13: warning: 'break' will never be executed [-Wunreachable-code-break] 3137 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3134:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3134 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3125:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3125 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3118:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3118 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3113:15: 
warning: 'break' will never be executed [-Wunreachable-code-break] 3113 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3108:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3108 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3103:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3103 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3061:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3061 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3057:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3057 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:3040:15: warning: 'break' will never be executed [-Wunreachable-code-break] 3040 | } break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/ggml-cuda.cu:2978:13: warning: 'break' will never be executed [-Wunreachable-code-break] 2978 | break; | ^~~~~ 15 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 29 warnings generated when compiling for host. [ 36%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/norm.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/norm.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/norm.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/norm.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & 
ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/im2col.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. [ 36%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/opt-step-adamw.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/opt-step-adamw.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/opt-step-adamw.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/opt-step-adamw.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & 
ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cu:90:13: warning: 'break' will never be executed [-Wunreachable-code-break] 90 | break; | ^~~~~ 15 warnings generated when compiling for host. [ 37%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/out-prod.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/out-prod.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/out-prod.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/out-prod.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu::2812:: 9:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh :warning: 318anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]: 23: warning: 281comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] | st 318r | u c t f{o r | ( ^ int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 
'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int 
ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h | :192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ struct { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/gla.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. 30 warnings generated when compiling for gfx1200. 6 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for host. [ 38%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/pad.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/pad.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/pad.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/pad.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1010. 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused 
parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: 
warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' 
to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { 
| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of 
different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1103. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h :in213t: 9D:) warning: {anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] | ^ 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: 
warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 30 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 6 warnings generated when compiling for gfx1150. 8 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1151. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1100. 6 warnings generated when compiling for gfx1151. 6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1101. 30 warnings generated when compiling for gfx900. 6 warnings generated when compiling for gfx1152. 6 warnings generated when compiling for gfx1152. 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1200. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static 
void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused 
parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | 
launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template 
specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 30 warnings generated when compiling for gfx906. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. 8 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const 
int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned 
int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 
'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx900. 8 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 8 warnings generated when compiling for gfx1151. 293 warnings generated when compiling for gfx1010. 6 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int 
ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx942. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx1152. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ 6 warnings generated when compiling for gfx908. 6 warnings generated when compiling for gfx908. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | stru/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuct: 80{: 48 :| ^warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hro:ws254:_9p:e rwarning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]_ cud 254a | _ b lo c k ] =s t{r0u.c0ft }{ ; | ^ | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of 
integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template 
specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest 
braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && 
(rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, 
nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmv.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared 
in an anonymous union are an extension [-Wnested-anon-types]/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 281 | struct { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 30 warnings generated when compiling for gfx908. 8 warnings generated when compiling for gfx1200. 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for host. [ 39%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/pool2d.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/pool2d.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/pool2d.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/pool2d.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared 
in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for 
gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu :17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z <298 ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' 
[-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 
'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 8 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1010. 30 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 6 
warnings generated when compiling for gfx90a. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 8 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous 
union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void 
on_no_fattn_vec_case(const int D) { | ^ 6 warnings generated when compiling for gfx1012. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 
'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cu:2: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/opt-step-adamw.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/out-prod.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 8 warnings generated when compiling for gfx906. 6 warnings generated when compiling for host. [ 40%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/quantize.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/quantize.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/quantize.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/quantize.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu 6 warnings generated when compiling for gfx942. 6 warnings generated when compiling for host. 
[ 41%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/rope.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/rope.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/rope.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/rope.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu 6 warnings generated when 
compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/norm.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: 
warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 30 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for host. [ 41%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/scale.cu.o 15 warnings generated when compiling for gfx1010. cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 
--offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/scale.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/scale.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/scale.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu 6 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < 
ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 8 warnings generated when 
compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | 30 warnings generated when compiling for gfx90a. struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const 
int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' 
[-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float 
*' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1010. 15 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested 
here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: 
warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ 8 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | structIn file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 
254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int 
* __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 6 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 8 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 6 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:56: warning: comparison of integers of different signs: 'unsigned int' and 'int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pad.cu:17:35: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 17 | if (nidx < ne00 && blockIdx.y < ne01 && blockIdx.z < ne02*ne03) { | ~~~~~~~~~~ ^ ~~~~ 6 warnings generated when compiling for gfx1012. 8 warnings generated when compiling for host. [ 42%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/softmax.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 
--offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/softmax.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/softmax.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/softmax.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | 
struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 30 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 6 warnings generated when compiling for 
gfx1102. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 6 warnings generated when compiling for gfx1035. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const 
int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | 
for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int 
ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ 15 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^6 warnings generated when compiling for gfx1030. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 
'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1101. 6 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 6 warnings generated when compiling for gfx1151. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could 
be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 15 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 30 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 
'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:24:19: warning: unused parameter 'ne00' [-Wunused-parameter] 24 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:27:19: warning: unused parameter 'ne03' [-Wunused-parameter] 27 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:28:19: warning: unused parameter 'ne10' [-Wunused-parameter] 28 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:31:19: warning: unused parameter 'ne13' [-Wunused-parameter] 31 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:32:19: warning: unused parameter 'ne31' [-Wunused-parameter] 32 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:33:19: warning: unused parameter 'nb31' [-Wunused-parameter] 33 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:36:19: warning: unused parameter 'nb03' [-Wunused-parameter] 36 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:39:19: warning: unused parameter 'nb13' [-Wunused-parameter] 39 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:40:19: warning: unused parameter 'nb21' [-Wunused-parameter] 40 | const int nb21, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:41:19: warning: unused parameter 'nb22' [-Wunused-parameter] 41 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:42:19: warning: unused parameter 'nb23' [-Wunused-parameter] 42 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:43:19: warning: unused parameter 'ne0' [-Wunused-parameter] 43 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:44:19: warning: unused parameter 'ne1' [-Wunused-parameter] 44 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:45:19: warning: unused parameter 'ne2' [-Wunused-parameter] 45 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:46:19: warning: unused parameter 'ne3' [-Wunused-parameter] 46 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 300 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:323:13: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<16, 4, false>' requested here 323 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 293 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:319:13: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<16, 4, false>' requested here 319 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:293:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 293 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:299:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 299 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f32.cu:344:9: note: in instantiation of function template specialization 'launch_fattn_tile_f32_64_128<32, 1, false>' requested here 344 | launch_fattn_tile_f32_64_128(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:294:13: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 294 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:300:13: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 300 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/fattn-tile-f16.cu:348:9: note: in instantiation of function template specialization 'launch_fattn_tile_f16_64_128<32, 1, false>' requested here 348 | launch_fattn_tile_f16_64_128(ctx, dst); | ^ 6 warnings generated when compiling for gfx1103. 30 warnings generated when compiling for host. 6 warnings generated when compiling for gfx1200. [ 43%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/sum.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 
--offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/sum.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/sum.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/sum.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu 30 warnings generated when compiling for host. [ 44%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/sumrows.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/sumrows.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/sumrows.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/sumrows.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1010. 6 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h s:um213,: 9co:n swarning: tanonymous types declared in an anonymous union are an extension [-Wnested-anon-types] i nt & 213k0 | 0 ) { | ^ struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 6 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hwarning: :213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct 
{/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. 6 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx900. 6 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ t { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx1152. 6 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx1100. 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 15 warnings generated when compiling for gfx1200. 6 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 6 warnings generated/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ when compiling for gfx1031. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * 
__restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 6 warnings generated when compiling for gfx1201. 15 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 6 warnings generated when compiling for gfx1101. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 6 warnings generated when compiling for gfx900. 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 6 warnings generated when compiling for /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ gfx1100. 15 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 6 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx1103. 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/pool2d.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 45%] Building CXX object 
ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/tsembd.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/tsembd.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/tsembd.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/tsembd.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ 6 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 15 warnings generated when compiling for gfx908. 6 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1010. 6 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 
'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 15 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. 6 warnings generated when compiling for gfx1012. 
6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & 
k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ 6 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/scale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. 15 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. [ 45%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/unary.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/unary.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/unary.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/unary.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu 6 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 293 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:1: 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cuh:4: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/quantize.cu:167:13: warning: 'break' will never be executed [-Wunreachable-code-break] 167 | break; | ^~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 15 warnings generated when compiling for host. [ 46%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/upscale.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/upscale.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/upscale.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/upscale.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ 6 warnings generated when compiling for gfx1200. 6 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1010. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 6 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 7 warnings generated when compiling for gfx1010. 6 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 
281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx1100. 6 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1201. 6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 6 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1101. 6 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 6 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]6 warnings generated when compiling for gfx1152. 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx906. 6 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 6 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1035. 6 warnings generated when compiling for gfx1150. 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1100. 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1200. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 161 warnings generated when compiling for gfx1030. 6 warnings generated when compiling for gfx942. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sum.cu:10: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ [ 47%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/wkv6.cu.o /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 
-Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/wkv6.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/wkv6.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/wkv6.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 
| mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/sumrows.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1102. 6 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. 
[ 48%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 7 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused 
parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 6 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function 
template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1150. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 64 warnings generated when compiling for gfx1010. 7 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. 6 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/softmax.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are 
an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' 
[-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 7 warnings generated when compiling for gfx1151. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 476 | launc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ h_fattn(ctx, dst, fatt/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hn:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ _kernel, nwa/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ rps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); 
| ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. 6 warnings generated when compiling for gfx1030. [ 49%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 
--offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu 6 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * 
nb01 + i00 * nb00); | ^ 7 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused 
parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. 61 warnings generated when compiling for gfx1010. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1200. 7 warnings generated when compiling for gfx1200. 64 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 6 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 
'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template 
specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of 
function template specialization 'launch_fattn<128, 2>' requested here 491 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 7 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | 
flash_attn_com/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hbi:n192e:_r9e:s uwarning: ltanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]s s t| ^r uc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuht: 476:{9 : note: | in instantiation of function template specialization 'launch_fattn<80, 4>' requested here ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281 :4769: | warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | l a u nc h _sftarttunc(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 61 warnings generated when compiling for gfx1012. 6 warnings generated when compiling for gfx90a. 64 warnings generated when compiling for gfx1031. 6 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 161 warnings generated when compiling for gfx1031. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 6 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: 
warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:63 warnings generated when compiling for gfx942. 
: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint3/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh2:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ _t *) &KQ_max_scale) &= f/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuht:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ z_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, trIn file included from u/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ e); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' 
drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never 
be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in 
instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, 
ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template 
specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vxIn file included from ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu :v1y: In file included from ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh :d1s: tIn file included from ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh: n20: c/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.ho:171l:9s:_ xwarning: ,anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] nrow s171 | _ x , n r o swtsr_uy,c tn c{o l| ^s _y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_b/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hl:oc213:k9]: warning: =anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] {0 .213 | 0 f }; | ^~~~s t r| u { }c t {/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu :| 185 ^ :13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hx:,298 :nr9:ow swarning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]_ y, 298n | r o w s _ d s ts)t;r u c| t ^{ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu| : ^230 :5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function 
template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, 
stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 
'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu | ^~~~: 22 :| 37 { }: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual]/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu :194:13: 22note: | in instantiation of function template specialization 'mul_mat_vec_q' requested here d s194t | [ i n d ex ] = * ( flmoualt_ m*a)t(_(vcech_aqr *<)txy p+e ,i 037 >*< n0)>; > | ( ^v x, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 7 warnings generated when compiling for gfx906. 61 warnings generated when compiling for gfx1030. 64 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/tsembd.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for host. 
[ 50%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1102. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: 
warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | 
const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 7 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. 61 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h_:a298tt:n9_:c warning: oanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]m bine _298r | e s u l t s < D ,s tpraurcatl l{e l _| b ^l ocks> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 6 warnings generated when compiling for gfx1103. 7 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in 
an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused 
parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function 
template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu::2133:: 9In file included from :/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :warning: 2anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554: 24213: | warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554s | t r u c t { *| ( ^ (uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { 
| ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 
'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 61 warnings generated when compiling for gfx1035. 7 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 6 warnings generated when compiling for gfx1150. 64 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union 
are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct {In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in 
instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 6 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 7 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 6 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 61 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function 
template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/upscale.cu:22:37: warning: cast from 'const float *' to 'char *' drops const qualifier [-Wcast-qual] 22 | dst[index] = *(float *)((char *)x + i03 * nb03 + i02 * nb02 + i01 * nb01 + i00 * nb00); | ^ 7 warnings generated when compiling for host. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 50%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && 
/usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu 64 warnings 
generated when compiling for gfx1030. 6 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/unary.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' 
requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function 
template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) 
&= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 6 warnings generated when compiling for host. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ [ 51%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu 61 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 
'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx942. 6 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx1010. 64 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 161 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/rope.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for 
(int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused 
parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 61 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 6 warnings generated when compiling for host. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ [ 52%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq1_s.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED 
-DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq1_s.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq1_s.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq1_s.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void 
on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * 
__restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' 
will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in 
instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, 
ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template 
specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h f:lo192a:t9: twarning: manonymous types declared in an anonymous union are an extension [-Wnested-anon-types]p [n c192o | l s _ y ] [ srtoruwcst _{ p | e ^r _cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | floa/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.ht: 298t:m9p:[ nwarning: canonymous types declared in an anonymous union are an extension [-Wnested-anon-types]o ls 298_ | y ] [ r o w s _p estrr_uccut d{a _ b| l ^ ock] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 
'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct 
{ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 64 warnings generated when compiling for gfx1012. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | 
float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 
'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 
16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused 
parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 61 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 58 warnings generated when compiling for gfx1012. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt !In file included from =/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ blockIdx.y) {/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 2813 | mul_mat_q_strea/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ m_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of 
function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 
2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 64 warnings generated when compiling for gfx1151. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ : warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ 
~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' 
[-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const intIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: 
unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uinIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int 
*' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ t32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | In file included from launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *)In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' 
requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ rallel_blocks>(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_maskIn file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ ; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, In file included from dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_resultsIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combiIn file included from ne_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ cks> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_resulIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ ts | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, trIn file included from u/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ e); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 554:24: warning: cast from 'const float *' to 'unsigned int *' 
drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of 
function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | */builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h(:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ (uint32_t *) &KQ_max_scale/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ ) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused 
parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ :3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true)64; | ^ warnings generated when compiling for gfx1030. | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ | ~ ^ ~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | 
flash/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ _attn_combine_resul/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuht:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ s | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused 
parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5:64 warnings generated when compiling for gfx1100. note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= 61f warnings generated when compiling for gfx1150. tz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, 
dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 58 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h :192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ struct { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h| :213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 64 warnings generated when compiling for gfx1152. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx1031. 64 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx1031. 61 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) 
{ | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused 
parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn:(3ct: xIn file included from ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :d2s: t/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh, :f554a:24t:t nwarning: _cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]ke rnel, n554w | a r p s , c o l*s(_(pueirn_tbl32oc_kt, *t)r u&eK,Q _tmrauex)_;s c a| l ^e ) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_perIn file included from _b/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cul:oc3k: ,In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:t2r: u/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhe:, 554t:24r:ue )warning: ;cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] | ^ 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn:( cwarning: tcast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]x , dst, 554f | a t tn _ k e r n*e(l,( uniwnatr3p2s,_ tc o*)l s&_KpeQr__mbalxo_cskc,a lter) u&e,= tfrtzu_em)a;s k ;| ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu(:c3t: xIn file included from ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh d:s2t: ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :f554at:t24n:_ kwarning: ecast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]r nel, n wa554r | p s , c o l s _*p(e(ru_ibnlto3c2k_,t t*r)u e&,K Qt_rmuaex)_;s c a| l ^e ) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fatIn file included from tn/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu<:D3, : pIn file included from a/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhr:a2l: l/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhe:l554_:b24l:o cwarning: kscast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]> (ctx, 554d | s t , f a t t n*(_(ukienrtne32l_,t *n) 
w&aKrQp_msax,_s ccaolles)_ p&=e rf_tbzl_omacskk,; t r| u ^e , t/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:r704:u5e):; note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here | ^ 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_In file included from re/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cus:ul3t: sIn file included from 554 | | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh : 505 :*5(: (note: uin instantiation of function template specialization 'launch_fattn<112, 1>' requested herei nt32_t 505* | ) & KQl_amunacxh__sfcaatlten)< D&,= pfatrza_lmlaeslk_;b l 
o| c ^k s>(ctx/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh,: 704d:s5t:, note: fin instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested hereat tn_ ke704r | n e l ,f nlwaashr_psa,t tcno_lcso_mpbeirn_eb_lorcesku,l tts ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combineIn file included from _r/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cue:su3l: tsIn file included from 554| | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh : 476 :*9(: (note: uin instantiation of function template specialization 'launch_fattn<128, 4>' requested herei nt32_t 476* | ) & K Q _ m a xl_asucnaclhe_)fa t&t=n 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh(:c704t:x5,: dnote: sin instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested heret, fa t704t | n _ ke r nfella,sh _nawtatrnp_sc,o mcboilnse__preers_ublltosc ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu: 3 *: (In file included from (/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhu:i2n: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuht:35542:_t24: warning: *cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]) &KQ _554 | m a x _ s c a *l(e(u)in t&3=2 _tf *t)z &_KQm_amsakx_;sc al | e ^) &= /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhf:t704z_:ma5s:k; note: | in instantiation of function template specialization 
'flash_attn_combine_results<128, 2>' requested here ^ 704/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh | : 704 :5 : flnote: ain instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested heres h_at t704n | _ c o m bfilnaes_hr_eastutlnt_sca r a| l ^l el_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhb:l491oc:k9s:> note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :491491 | : 9 : note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here lau nc491h | _ f a t t n < D ,l apuanrcahl_lfealt_tbnla(rcatlxl,e ld_sbtl,o cfkast>t(nc_tkxe,r ndestl,, nfwatartpns_k,e rcnoells,_ pnewra_rbplso,c kc,o ltsr_upee,r _tbrluoec)k;, t| r ^u e, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_masIn file included from k/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu;: 3 : | In file included from ^/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh::704554::245: :warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 554 | 704 | f l a*s((hu_ianttt3n2__cto m*b)i n&eK_Qr_emsauxl_tssc| ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh::704505::55:: note: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested herein instantiation of function template specialization 'launch_fattn<128, 1>' requested here 704 | 505 | f llaasuhn_caht_tfna_tctonma(lcltexl,_ bdlsotc,k sf>a t t| n ^_ ker/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhn:e505l:,5 :n wnote: ain instantiation of function template specialization 'launch_fattn<256, 1>' requested herer ps, co l505s | _ p e rl_baluoncchk_, ftatrtune<,D t,r upea)r;a l l| e ^l _blocks>(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: 
warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | 
const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast 
from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx1035. 61 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_bloc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hk,: 213t:r9u:e ,warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]tr ue) ; 213 | | ^ struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, col/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hs_:pe298r:_9b:l owarning: canonymous types declared in an anonymous union are an extension [-Wnested-anon-types]k , tr u298e | , t r u e ) ; s t| r ^u ct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | structIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 
'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1100. 64 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx1100. 6 warnings generated when compiling for gfx942. 61 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 161 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter]In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu: 319: | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :1 : In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh :f20: l/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hoa:t1712:9 : warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] * _ 171_r | e s tr i c t_ s_t rdusctt_m e{t a ,| ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' 
[-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hin:t192 :n9e:0 3warning: ,anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] | ^ 192/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh | : 30 : 19 : warning: unused parameter 'ne10' [-Wunused-parameter] st r30u | c t { | ^ const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h : 213 : 9 :c owarning: nanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]s t in t213 | n b 1 2 , | ^s tr/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhu:c41t: 19{: warning: | unused parameter 'nb13' [-Wunused-parameter] ^ 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: 
warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/wkv6.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32In file included from _t/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu :n_3h: eIn file included from 
a/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhd:_2l: o/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhg:2554,: 24 :| ^warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: 554warning: | unused parameter 'logit_softcap' [-Wunused-parameter] 25 | * (( u in t 3c2o_nts t* )f l&oKaQt_ mlaoxg_sictal_es)o &f= tfctza_mp,a sk ;| ^| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh::70419:5:: warning: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested hereunused parameter 'ne00' [-Wunused-parameter] 704 | 26 | f la s h _ at t nc_ocnomsbti nien_tr enseu0l0t,s < D| , ^ pa/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhra:l27l:e19l:_ bwarning: lunused parameter 'ne01' [-Wunused-parameter]o ck s27> | | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :505 :c5:o nsnote: tin instantiation of function template specialization 'launch_fattn<128, 1>' requested here in t505 | n e 0 1l,au n| c ^h _f/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:at28t:n<19D,: pwarning: aunused parameter 'ne02' [-Wunused-parameter]ra l l28el | _ b lo c k s > ( cctonxs, td istn, tf antten_02k,e rn e| ^l ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :n29:wa19r:p swarning: 
,unused parameter 'ne03' [-Wunused-parameter] co l29s_ | p e r _ b l occokn,s tt riunet, ntreu0e3),; | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused 
parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 6 warnings generated when compiling for host. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ [ 53%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_s.cu.o In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_s.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_s.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_s.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function 
template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1101. 64 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ 58 warnings generated when compiling for gfx1101. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function 
template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 61 197 warning | s generated when compiling for mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in 
instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | 
^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) 
{ | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused 
parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne0In file included from 0/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ , consIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ t int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ :2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const intIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ & stIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ ride11, const int & ne0, | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devIn file included from i/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 
704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ ces[iIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ d].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 
'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ :2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ if (it != blockIdx.x |/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh|:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ ixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ >> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != 
blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here In file included from 2813/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1151. 64 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx1102. 61 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarp/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hs,: 298c:o9l:s _warning: panonymous types declared in an anonymous union are an extension [-Wnested-anon-types]e r_bl o298c | k , t r u e , sttrruuec)t; { | ^| ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 
'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of 
function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, 
const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1152. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 64 warnings generated when compiling for gfx1103. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^
58 warnings generated when compiling for gfx1103. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 61 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' 
[-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused 
parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | 
static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' 
[-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused 
parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int 
l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused 
parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of 
function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 58 warnings generated when compiling for gfx1150. 64 warnings generated when compiling for gfx1200. 64 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ 61 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: 
unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const 
float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 
'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of 
function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh: 563554: | 47 : warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563*( | (stuatinitc3 2v_oti d* ) o&nKQ__mnaxo_s_cfaaltet)n &_= vefct_z_cmaasske; ( | co ^ nst/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :i704:n5:t note: Din instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here) { 704 | | ^ flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast 
from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function 
template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 58 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1151. 64 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 61 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 
'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 
16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 64 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' 
[-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13In file included from ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu :| 3 ^: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh::234: :/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh19::554 :warning: 24unused parameter 'ne31' [-Wunused-parameter]: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]34 | 554 | c o n s t i nt* (ne(3u1i,n t 3| 2 ^_ t /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh*:)35 :&19K:Q _warning: munused parameter 'nb31' [-Wunused-parameter]a x_ s35ca | l e ) & = f 
ctoz_nmsats ki;n t n| ^b 31, | ^/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :704/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh::536:: 19note: :in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here warning: unused parameter 'nb01' [-Wunused-parameter] 70436 | | f l a s hc_oantsttn _icnotm bnibn0e1_,r e s| u ^l ts/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh<:D37,: 19p:a rwarning: alunused parameter 'nb02' [-Wunused-parameter]l el _37b | l o c k s > | c ^o nst/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :i491nt: 9:n b0note: 2in instantiation of function template specialization 'launch_fattn<96, 2>' requested here, | ^491 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh: 38 : 19: lawarning: ununused parameter 'nb03' [-Wunused-parameter]c h _38f | a t t n b(0c3t,x , d| st ^ ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh f:a39t:t19n:_ kwarning: eunused parameter 'nb11' [-Wunused-parameter]r ne l,39 | n w a rcopnsst ,i ncto lnsb_p1e1r,_b l | o ^ ck/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:,40 :t19:r uwarning: e,unused parameter 'nb12' [-Wunused-parameter] t 40r | u e ) ; | ^co nst int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= 
ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function 
template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 58 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1152. 64 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 161 warnings generated when compiling for gfx1101. 61 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused 
parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | 
static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for host. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ [ 54%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu.o In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 58 warnings generated when compiling for gfx1200. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | 
^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mulIn file included from _m/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cuat:_3v: eIn file included from c_q/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh_:c2: 
ud/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuha:(vx, v y318, | d s t , fnocro l(si_nxt, ln r=o w0s;_ xl, ' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; 
| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces 
around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu, : 80| : ^48 : /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhwarning: :suggest braces around initialization of subobject [-Wmissing-braces]21 :21: warning: unused parameter 'max_bias' [-Wunused-parameter] 80 | 21 | f l o caotn sttm fpl[onatc moalxs__byi]a[sr,o w s_| p ^e r_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:c22:u21d:a _warning: bunused parameter 'm0' [-Wunused-parameter]lo c k22] | = { 0 . 
0cfo}n;s t | ^~~~fl oa t | { }m0 , | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu ^: 185/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh::1323:: 21note: :in instantiation of function template specialization 'mul_mat_vec_q' requested here warning: unused parameter 'm1' [-Wunused-parameter] 23185 | | c o n s tm ufll_omaatt _mv1e,c _ q| 24<:< e>a>d(_vlxo,g 2v,y , | d ^s t,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :nc25o:l21s:_ xwarning: unused parameter 'logit_softcap' [-Wunused-parameter], nr o25w | s _ x , n r o wcso_nys,t nfrloowast_ dlsto)g;i t _| s ^of tca/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cup:,237 : 5| : ^ note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :26:19: 237warning: | unused parameter 'ne00' [-Wunused-parameter] 26m | u l _ m a t _ vceocn_sqt_ ciundta :(19v: xwarning: ,unused parameter 'ne01' [-Wunused-parameter] vy, 27d | s t , n c o l sc_oxn,s tn rionwts _nxe,0 1n,r o w| s ^_ y,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :nc28o:l19s:_ ywarning: ,unused parameter 'ne02' [-Wunused-parameter] nr o28w | s _ d s tc, osnsttre ianmt); ne 0| 2 ^, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu 46: | 80 : 48 : warning: suggest braces around initialization of subobject [-Wmissing-braces] const in t80 | n e 1 , f l| o ^a t /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuht:m47p:[19n:c owarning: lunused parameter 'ne2' [-Wunused-parameter]s _y ]47[ | r o w s _ p e r _ccoundsat_ bilnotc kn]e 2=, { 0| . 
^0 f}/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh;: 48 :| 19 ^~~~: warning: | unused parameter 'ne3' [-Wunused-parameter] { } 48 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu : 188 : 13 : cnote: oin instantiation of function template specialization 'mul_mat_vec_q' requested heren st int n188e | 3 ) { | ^ mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested 
here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>> (554 | v x , v y ,* (d(sutin, t3n2c_otl s_x*) ,& KnQ_max_rscale) &=o fwts_zx_,m anskr; o | w ^s _y, /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhn:704r:o5w: snote: _in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here dst )704; | | f ^l ash/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu_:at307t:n5_:co mbnote: inin instantiation of function template specialization 'mul_mat_vec_q_cuda' requested heree _re 307su | l t s < Dm,ul p_armaalltel__bvelco_cqk_sc> ud a| < ^G GM/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhL:491_:9T:YP Enote: _in instantiation of function template specialization 'launch_fattn<64, 2>' requested hereI Q1_ 491S | > ( v x , lvauyn,ch d_fsatttn, (,c tnx,r dowsts, _fya,t tnnc_oklesr_neyl,, nnwraorwps_s,ds tc,o lsst_rpeera_bmlo);ck , t| r ^u e, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: 
suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncIn file included from o/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.culs:_3y: ]In file included from [/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:r2: o/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhw:s554:_24p: ewarning: rcast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]_ cud a554_ | b l oc k ] =* ({(0u.0ifn}t;3 2 _| t ^~~~ * ) | { }& KQ_m/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cua:x_191sc:13al:e )note: in instantiation of function template specialization 'mul_mat_vec_q' requested here& = ft z191_ | m a sk ; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhm:u704l:5_: mnote: ain instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested heret _v 704e | c _ qfc , | s ^t rea/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhm:>>476:>9(:v xnote: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here, vy , 476d | st , n c o l s _lxa,un nchr_fowatstn_(sc_tdxs,t )d;st , f| a ^tt n_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuk:e307r:n5e:l ,note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested heren war ps307, | c o l s_mpuelr_m_abtl_ovcke, ct_rqu_ec, udtra(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 
80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of 
function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_In file included from m/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cuat:3_: vIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhe:2c_: q/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh_:cu554d:a24<:G Gwarning: Mcast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]L _TY 554P | E _ I Q 1_ M >*((v(uxi,n tv3y2,_ t d*s)t ,& KnQc_omlasx__xsc, anlreow)s &_= x,f tnz_rmaowsks;_ y , | n ^ col/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:s704_:y5, :n rnote: owin instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here s_ d704 | s t , fsltarseh_amat)t;n _c o| mb ^in e_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' 
requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncoIn file included from 
l/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cus_:y3: ]In file included from [/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhr:ow2: s/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh_:p554e:24r: _warning: ccast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]u da_ b554 | l o ck ] = {*0((.u0ifnt}32;_ t | *) ^~~~ & K Q_| m { }ax _sca/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cul:194e:)13 :&= note: in instantiation of function template specialization 'mul_mat_vec_q' requested hereft z_m as194k | ; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh : 704 :5 : m note: uin instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested herel _m 704a | t _ v e cf_laqsh<_atytptne_c, om7bi>ne<_, | 0 ^, s/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuht:r491e:a9m:>> >note: (vin instantiation of function template specialization 'launch_fattn<96, 2>' requested herex , vy 491, | d s t , n c loaulsnc_h_xfa,t tnnr(ncrtxow, sds_dts, tfa)tt;n_ k| e ^rn el/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu,: 314n:w5a:r pnote: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested heres, co ls314_p | e r _b lomcku,l _tmruae,t t_vrueec);_ q| ^_ cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results: 80| : ^48 : warning: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhsuggest braces around initialization of subobject [-Wmissing-braces]: 505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 80 | 505f | l o a t tlmapu[nnccho_lfsa_tyt]n[]( c=t x{,0 .d0sft},; f a| t ^~~~tn _ | k { }e rnel, n/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuw:a176r:p13s:, note: cin instantiation of function template specialization 'mul_mat_vec_q' requested 
hereo ls_per_ b176l | o ck , tr u e , tr u e)m;u l _| m ^a t_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<: >In file included from >/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh(:v2x: ,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :v554y:,24 :d swarning: t,cast from 'const float *' to 'unsigned int *' 
drops const qualifier [-Wcast-qual] ncols_ x554, | n r ow s _ x, * (nr(ouwisn_ty3,2 _ntr o*ws) _&dKsQ_tma)x;_ s ca| ^le ) /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu&=:321 f:t5z:_m asnote: kin instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here; | ^321 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :704 :m5u:l _note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested herem at_ 704v | e c _fqla_shcu_datat<(Dv, xpa, ravlyl,e dl_sblto,c ksn> c o| l ^s _x/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh,:476 :n9r:o wnote: in instantiation of function template specialization 'launch_fattn<112, 4>' requested heres _x, 476n | r o w s _y ,l nacunoclhs__fya,t tnnr( c tx| , ^ dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | 
^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu :80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of 
function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 
'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh::80491::948:: 
note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested herewarning: suggest braces around initialization of subobject [-Wmissing-braces] 491 | 80 | l au nfclh_ofaattt ntw(sct_xp,e rds_tc, ufdaatt_nb_lkoecrkn]e l=, {n0w.a0rfp}s;, c| o ^~~~l s _p| e { }r _bloc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuk,:185 :t13ru:e ,note: tin instantiation of function template specialization 'mul_mat_vec_q' requested hereru e); 185 | | ^ mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: 
in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, In file included from ds/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cut:,3 : nIn file included from c/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhol:2s: _/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhx:,554 n:r24o:w swarning: _cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]x , nrows _554y | , n r o ws _ *d(st()u;i n t| 32 ^_ t /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu*): 328&:K5Q: _note: min instantiation of function template specialization 'mul_mat_vec_q_cuda' requested herea x_scal e328) | & = mfutlz__mmaastk_v; e c| _q ^_ cud/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuha:704<:G5:G Mnote: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested hereL _T Y704P | E _ I Q4 f_laXsSh>_(avxtt,n _vcyo,m bidnes_tr,e sunltcso w| s ^ _y/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:,505 :n5c:o lnote: sin instantiation of function template specialization 'launch_fattn<128, 1>' requested here_ y, n505r | o ws _ldsatu, nscht_refaatmtn)(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function 
template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, 
stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 
'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 64 warnings generated when compiling for gfx1200. 64 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 61 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused 
parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3)/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh {: 2691 | : ^36 : warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 58 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused 
parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx1201. 64 warnings generated when compiling for gfx908. 61 warnings generated when compiling for host. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ [ 54%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ 
~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused 
parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struIn file included from c/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ t { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested 
here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' 
drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function 
template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 58 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int 
*' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused 
parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different 
signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) 
{ | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 64 warnings generated when compiling for gfx900. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 
'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | 
^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused 
parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 58 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused 
parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu2805: | 3 : /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh : 14 : 35 :m uwarning: lunused parameter 'Q' [-Wunused-parameter]_ mat_q_ s14t | r e a m _ k _ f icxounps:< > > | ^| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:162852:35::13 :warning: unused parameter 'V' [-Wunused-parameter]note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 16 | 2852 | c o n st clhaaurn ch*_ _m_url_esmtartic_t_q_< tVy,p e | , ^ 
8/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh>:(17c:tx35,: warning: arunused parameter 'mask' [-Wunused-parameter]g s, s17tr | e am ) ; | ^c ons/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuht :c2691h:ar16 :* _warning: _comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]re str 2691i | c t _ _ m aisf k(,i t !| = ^ b/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhl:18o:c35k:I dwarning: xunused parameter 'dst' [-Wunused-parameter]. x |18| | jt ! = b l oc kIfdlxo.ayt) { * _| _ ~~ ^ ~~~~~~~~~~r estrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' 
[-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh37::192691:: warning: 36unused parameter 'nb02' [-Wunused-parameter]: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]37 | 2691c | o n s t i n t inb02f, ( | i ^t !/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh=: b38l:o19:ck Iwarning: unused parameter 'nb03' [-Wunused-parameter]dx .x 38| | | j t ! = cbolnosctk Iidnxt. 
yn)b 0{3 , | ~~ ^ ~~~~~~~~~~| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh::192813:: 9warning: :unused parameter 'nb11' [-Wunused-parameter] note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 39 | 2813 | c on st i nmtu nlb_m11at, _ q_| ^s tre/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuha:m40_:k19_:f iwarning: xunused parameter 'nb12' [-Wunused-parameter]u p:19<:<< bwarning: unused parameter 'nb13' [-Wunused-parameter]l ock _41n | u m s _ x y _ t icloinnsgt, ibnlto cnkb_1d3i,m s ,| ^0 , /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhs:tr42e:a19:m >>warning: >unused parameter 'nb21' [-Wunused-parameter] | ^42 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh: 2852 : 13 : note: coin instantiation of function template specialization 'launch_mul_mat_q' requested here nst i n2852t | n b 2 1 , | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhla:u43:n19c:h _warning: munused parameter 'nb22' [-Wunused-parameter]u l_m a43t | _ q < t y p e , c o n8s>t( citnxt, nabr2g2s,, s| t ^r ea/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuhm:);44 :19 | : ^ warning: unused parameter 'nb23' [-Wunused-parameter] 44/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh | : 2691 :16 : warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]c onst 2691i | nt n b 2 3 , i f| ^ 
(it/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh :!45=: 19b:l owarning: cunused parameter 'ne0' [-Wunused-parameter]k Idx .45x | | | j t ! =c obnlsotc kiIndtx .nye)0 ,{ | ^| ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :| ^2691 :36:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :warning: 704comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]:5 : note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 2691 | 704 | f l aisfh _(aittt n!_=c obmlboicnkeI_drxe.sxu l|t|s | | ~~ ^ ~~~~~~~~~~ ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh5:: 2805note: :9in instantiation of 
function template specialization 'launch_fattn<64, 1>' requested here: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 505 | 2805 | l a un c h _ fa tmutln<_Dma,t p_qa_rasltrleela_mb_lko_cfkixsu>(pc_>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<(>u> i n| ^t 32_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuht: *2897):13 :& Knote: Qin instantiation of function template specialization 'launch_mul_mat_q' requested here_ ma x_2897s | c a le ) & = f t zl_maausnckh;_ m u| l ^_ 
mat_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhq:<704t:y5:p enote: ,in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 1 28> (704c | t x ,f laarsgh_sa,tt ns_ctomrbeianme)_;r e| ^s ult/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhs:<2691D:,16 :p awarning: rcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]a lle l_2691b | l o c k s > | i ^f (/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:i505t :!5=: b lnote: oin instantiation of function template specialization 'launch_fattn<128, 1>' requested herec kIdx .505x | | | j t l!a= ubnlocchk_fIatdtnx(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | 
launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int 
*' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused 
parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 64 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 64 warnings generated when compiling for gfx942. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | 
float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 161 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template 
specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int 
*' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused 
parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | 
*((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: 
function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 
'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ 64 warnings generated when compiling for host. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 
'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ [ 55%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_s.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_s.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_s.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_s.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 
'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are 
an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 58 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of 
integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused 
parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { 
| ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 64 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused 
parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 
| if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results 
| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mIn file included from at/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu_:q3<: tyIn file included from pe/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh,: 12: 28/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:>(554c:tx24, : awarning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]rg s, 554s | t re am ) ; *| ^( (ui/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhn:t26913:162_:t *warning: ) comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]&K Q_ m2691 | a x _s ca le ) & = iff (titz !_=ma skb; l | o ^c kId/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhx:.x704 :|5|: jnote: tin instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here ! 
= b l704o | c k I d xf.laysh)_a t{ t n| _ ~~ ^ ~~~~~~~~~~c ombine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 
554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 58 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused 
parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function 
template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 64 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | 
float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ 78 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template 
specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: 
in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 58 warnings generated when compiling for host. [ 56%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 
--offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { 
| ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:14:35: warning: unused parameter 'Q' [-Wunused-parameter] 14 | const char * __restrict__ Q, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:15:35: warning: unused parameter 'K' [-Wunused-parameter] 15 | const char * __restrict__ K, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:16:35: warning: unused parameter 'V' [-Wunused-parameter] 16 | const char * __restrict__ V, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:17:35: warning: unused parameter 'mask' [-Wunused-parameter] 17 | const char * __restrict__ mask, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:18:35: warning: unused parameter 'dst' [-Wunused-parameter] 18 | float * __restrict__ dst, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:19:35: warning: unused parameter 'dst_meta' [-Wunused-parameter] 19 | float2 * __restrict__ dst_meta, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:20:21: warning: unused parameter 'scale' [-Wunused-parameter] 20 | const float scale, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:21:21: warning: unused parameter 'max_bias' [-Wunused-parameter] 21 | const float max_bias, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:22:21: warning: unused parameter 'm0' [-Wunused-parameter] 22 | const float m0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:23:21: warning: unused parameter 'm1' [-Wunused-parameter] 23 | const float m1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:24:24: warning: unused parameter 'n_head_log2' [-Wunused-parameter] 24 | const uint32_t n_head_log2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:25:21: warning: unused parameter 'logit_softcap' [-Wunused-parameter] 25 | const float logit_softcap, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:26:19: warning: unused parameter 'ne00' [-Wunused-parameter] 26 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:27:19: warning: unused parameter 'ne01' [-Wunused-parameter] 27 | const int ne01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:28:19: warning: unused parameter 'ne02' [-Wunused-parameter] 28 | const int ne02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:29:19: warning: unused parameter 'ne03' [-Wunused-parameter] 29 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:30:19: warning: unused parameter 'ne10' [-Wunused-parameter] 30 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:31:19: warning: unused parameter 'ne11' [-Wunused-parameter] 31 | const int ne11, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:32:19: warning: unused parameter 'ne12' [-Wunused-parameter] 32 | const int ne12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:33:19: warning: unused parameter 'ne13' [-Wunused-parameter] 33 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:34:19: warning: unused parameter 'ne31' [-Wunused-parameter] 34 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:35:19: warning: unused parameter 'nb31' [-Wunused-parameter] 35 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:36:19: warning: unused parameter 'nb01' [-Wunused-parameter] 36 | const int nb01, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:37:19: warning: unused parameter 'nb02' [-Wunused-parameter] 37 | const int nb02, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:38:19: warning: unused parameter 'nb03' [-Wunused-parameter] 38 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:39:19: warning: unused parameter 'nb11' [-Wunused-parameter] 39 | const int nb11, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:40:19: warning: unused parameter 'nb12' [-Wunused-parameter] 40 | const int nb12, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:41:19: warning: unused 
parameter 'nb13' [-Wunused-parameter] 41 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:42:19: warning: unused parameter 'nb21' [-Wunused-parameter] 42 | const int nb21, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:43:19: warning: unused parameter 'nb22' [-Wunused-parameter] 43 | const int nb22, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:44:19: warning: unused parameter 'nb23' [-Wunused-parameter] 44 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:45:19: warning: unused parameter 'ne0' [-Wunused-parameter] 45 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:46:19: warning: unused parameter 'ne1' [-Wunused-parameter] 46 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:47:19: warning: unused parameter 'ne2' [-Wunused-parameter] 47 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:48:19: warning: unused parameter 'ne3' [-Wunused-parameter] 48 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const 
qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<64, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template 
specialization 'launch_fattn<80, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<80, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<80, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: 
note: in instantiation of function template specialization 'flash_attn_combine_results<80, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<80, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<96, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<96, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<96, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<96, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<112, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<112, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<112, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<112, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | 
__device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 2>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<128, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, 
true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:476:9: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 476 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 2>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:491:9: note: in instantiation of function template specialization 'launch_fattn<256, 2>' requested here 491 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-wmma-f16.cuh:505:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 505 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, true, true); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 
'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void 
mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 64 warnings generated when compiling for host. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ [ 57%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | 
^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 78 warnings generated when compiling for gfx1010. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 161 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 
281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: 
note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = 
{0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function 
template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template 
specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 78 warnings generated when compiling for gfx1012. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 
'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template 
specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 161 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1012. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | 
mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' 
requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 78 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' 
[-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned 
int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 78 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * 
__restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, 
args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | In file included from mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 161 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 
281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 78 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const 
int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stre/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:am213_:k9_:f iwarning: xanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]u p<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh298::28139::9 :warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 298 | 2813 | st r uc t mu{l _ m| a ^t _q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of 
different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | 
launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 293 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != 
blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ const mma_int_B_J8K4 & mma_B) { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != 
blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stre/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuham); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 
'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function 
template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, d/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ st, ncols_x, nrows_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ x, nrows_y, nrows_dst);/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 230 | mul_ma/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.ht:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ _vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: 
warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of 
function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | 
mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | 
mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < 
rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, 
nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 In file included from |/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ | row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && 
(rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, 
nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * 
__restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, nconst int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ rows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_bl/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ock == 1 || row0 + threadIdx.x < 
nrows_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (thr/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhe:a2691:d36Id:x .warning: x comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]< rows _2691p | er _c u d a _iblfo c(ikt & !&= (rbolwosc_pkeIrdx_.cuxd |a_|b ljotc k !=== bl1o |c|k Idrox.w0y ) +{ t h | r ~~ ^ ~~~~~~~~~~ea dIdx/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh.:x 2805<:9 n: rnote: oin instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested herew s_d s2805t | ) ) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~m 
ul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (i/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cut :!80=: 48b:l owarning: csuggest braces around initialization of subobject [-Wmissing-braces]k Idx.x || 80j | t ! = fbllooactk Itdmxp.[yn)c o{l s _| y ~~ ^ ~~~~~~~~~~] [rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | 
mul_mat_q_stream_k_fixup/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh>_>cu d a| _ ^b loc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:k 2855:=13= :1 note: |in instantiation of function template specialization 'launch_mul_mat_q' requested here| r 2855ow | 0 + t h r e a dI dlx.auxn (ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 
2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ , vy, dst, ncols_x, nrows_x, nrows_y, nc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of 
integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != 
blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ _q<<' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ , stream>>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' 
[-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_ds/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuht:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ )) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' 
requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stre/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuha:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ m); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ dst, ncols_x, nrows_x, nrows_y, nrows_dst/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ float tmp[ncols_y][rows_per_cuda_b/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ lock] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ if (threadIdx.x < rows_per_cuda_bl/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ock && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ TYPE_IQ2_XS>(vx, vy, dst, ncols_x, nrow/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhs:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ _x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | m/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ul_mat_vec_q<<' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ k_dims, 0, stream>>>(vx, vy, dst, ncols_x, 
nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || 
jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrow/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhs:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ _dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ nrows_y, ncols_y, nrows_dst, stream);/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: 
warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 
'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ >>>(vx, vy, dst, ncols_x, nrows_x, nro/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ws_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' 
[-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | 
mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | 
mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | 
^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { 
| ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 78 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int 
& k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 78 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh_:_2691r:es36:tr iwarning: ccomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] t__ x, c2691on | s t i n t * if_ _r(eistt r!i=c tb_l_o cyk,I dxfl.xoa t|| * j t__ r!e=s tbrliocctk_I_dx .syu)m ,{ c o n| ~~ ^ ~~~~~~~~~~s t in/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuht: 2813&: 9k:0 0note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here) { | ^2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:9::2691 :note: 36in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here: 
warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2805 | m2691u | l _m a t _ q _ s tirfe a(mi_kt_ !fi=x bulp<<' requested here b lock_d i2805m | s , 0 , s t r emauml>_>m>a t _| q ^_ str/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhe:a2897m:_13k_:f note: iin instantiation of function template specialization 'launch_mul_mat_q' requested herexu pq<_(ncutmxs,_ xayr_gtsi,l isntgr,e abml)o;c k _| d ^i ms, 0,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :s2691t:r16e:a mwarning: >>comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]> | ^ 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh : 2852 : 13 :i fnote: in instantiation of function template specialization 'launch_mul_mat_q' requested here( it ! =2852 | b l o c kI dx . x | | ljatu n!c=h _bmluolc_kmIadtx_.qy<)t y{p e ,| ~~ ^ ~~~~~~~~~~ 8>(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != block/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhId:x2691.:x 36|:| warning: jcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]t != b2691l | o c k I d x . 
yi)f ({i t !=| ~~ ^ ~~~~~~~~~~b loc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:kI2813:d9x: .note: xin instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here || j2813t | ! = b l o c k Imduxl.y_)m a{ t _q| _ ~~ ^ ~~~~~~~~~~s tre/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuham:_k2813_f:ix9up:' requested here, mm q2813_ | x , M M Q_ N W AmRuPlS_,m naete_qd__sctherceak>m<<_k<_bfilxoucpk<_tnyupmse_x,y _mtmqil_xin,g ,M MbQl_ocNkW_AdRiPmSs,, 0,n esetrde_acmh>e>c>k > <| < ^< bl/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:o2897:ck13:_n note: uin instantiation of function template specialization 'launch_mul_mat_q' requested herem s_ xy2897_ | t i l i n g, bllauoncckh__dmimus,l_ ma0t_,q< tyspet,r e12a8>m>(>c>t x| ^, a/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:rg2852:s13:, note: in instantiation of function template specialization 'launch_mul_mat_q' requested heres tr e2852a | m) ; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh: 2691 :l16a: uwarning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]n ch _2691 | m u l _ m at _q (cbtlxo,c kaIrdxg.xs , |s|t jrt e!=a mb)l;o c k| I ^d x.y)/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh: 2691{: 16 : | ~~ ^ ~~~~~~~~~~warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 293 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never 
be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 78 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ 
sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 78 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const 
int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != 
blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ : warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template 
specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of 
integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 
'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ 
^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != bloc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhk:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison 
of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ Idx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2691 | if (it != blockIdx.x || /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhj:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ t != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: 
note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2691 | if (it != blockIdx.x || jt !=/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function 
template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 78 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are 
an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 78 warnings generated when compiling for gfx1100. 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, 
const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 
2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<&>> n e0| 0, ^ co/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhn:s2870t: 13i:n tnote: in instantiation of function template specialization 'launch_mul_mat_q' requested here& n e2870 | 0 1 , co n s t i nlatu n&c hst_rimduel0_m1at,_q e(1c0t,x ,c oanrsgts ,i nstt r&e anme)1;1 , | c ^o nst in/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuht: 2691&: 16s:tr iwarning: dcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]e 11, co2691n | s t i n t & infe 0(,i t | ! 
^= bloc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhk:I2497d:x75.:x warning: |unused parameter 'ne10' [-Wunused-parameter]| jt != b l2497o | c k I d xc.oyn)s t{ i n| t ~~ ^ ~~~~~~~~~~ & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h!:= 254b:l9o: cwarning: kanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]I dx .254x | | | jsttr u!c= tb l{ o ck| ^I dx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of 
function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 293 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never 
be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 78 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh78 warnings generated when compiling for gfx1101. 
:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 293 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, 
const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_i/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned 
int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ nt_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' 
[-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh ~~ ^ ~~~~~~~~~~ :1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ s, 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) 
{ | ~~ ^ ~~~~~~~~~~ eck><<' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ims, 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested 
here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ype, mmq_x, MMQ_NWARPS, need_check><<' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ block_nums_xy_tiling, block_dims, 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in 
instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mu/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ l_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :2691:36: warning: comparison of integers 
of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != bloc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ kIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh{: 2691 :| 36 ~~ ^ ~~~~~~~~~~: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9 :2691 | note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here i2805f | ( i t ! 
= bmluolc_kmIadtx_.qx_ s|t|r ejatm _!k=_ fbilxoucpk' requested heree ed_che c2813k | > < < < b l o c km_unlu_mmsa_tx_yq__tsitlrienagm,_ kb_lfoicxku_pdM>Q>_ N W| A ^R PS,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :n2897e:e13d:_ cnote: hin instantiation of function template specialization 'launch_mul_mat_q' requested heree ck> <2897< | < b l o c k _ n u m s _ xlya_utniclhi_nmgu,l _bmlaotc_kq_t(rcetaxm,> >a>r g s| , ^ str/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhe:a2870m:)13;: note: | in instantiation of function template specialization 'launch_mul_mat_q' requested here ^ 2870/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh | : 2691 : 16 : warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] l2691a | u n c h _ m u l _imfa t(_iqt< t!y=p eb,l o c5k6I>d(xc.txx ,| |a rjgts ,! 
=s tbrleoacmk)I;d x .| y ^) { | ~~ ^ ~~~~~~~~~~/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ dx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, 
stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<>>(vx, vy, dst, ncols_x/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ , nrows_x, nrows_y/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ , nrows_dst); /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, 
const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, 
nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; 
| ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 866 | const int * __restrict__ x, const int * __re/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, 
nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ strict__ y, f/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ l/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ oat * __re/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ strict__ sum, const int /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu&:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ k00) { | ^/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && 
(rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, 
nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, 
const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * 
__restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 
2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 293 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<< > > | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh: b2876r:e13a:k ;note: in instantiation of function template specialization 'launch_mul_mat_q' requested here | ^~~~~ 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 
'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around 
initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | 
if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, 
dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, 
ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 78 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct 
{ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { 
| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 293 warnings generated when compiling for gfx908. 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject 
[-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | 
^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { 
| ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuvo:i126d: 98m: mawarning: _comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare]K 8(con s126t | m m a _ i nitf_ A(_tIh1r6eKa8d Id&x .xm m' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < 
rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhds:t1053,: 99n:c owarning: lunused parameter 'k00' [-Wunused-parameter]s _x, nrows _1053x | , n r o wcso_nys,t nirnotws _*ds __tr)e; s t| ^r 
ic/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:t321_:_ 5x:, cnote: oin instantiation of function template specialization 'mul_mat_vec_q_cuda' requested heren st 321in | t * __ rmeuls_mtarti_cvte_c__ qy_,c ufdlao (svuxm,, vcyo,n sdts t,i nncto l&s _kx0,0) n{r o ws| ^_ x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 
| float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && 
(rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, 
nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuin:t126 :&98 :s warning: tcomparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare]r ide11, c126o | n s t i n t i&f n(eth0r,e a d| I ^dx .x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < 
rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, 
nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 293 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never 
be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 78 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, 
const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 78 warnings generated when compiling for gfx1152. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 293 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, 
stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 78 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const 
int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | 
launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ : warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h_:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ _device__ __forc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ einline__ void mma_K4(c/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ onst mma_int_A_I1/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h6:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ K4 & mma_A,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | 
~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * 
__restrict__ sum, const int & k00) { | ^ ream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 293 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:57:34: warning: unused parameter 'nrows_x' [-Wunused-parameter] 57 | const int ncols_x, const int nrows_x, const int nrows_y, const int nrows_dst) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:418:13: warning: 'break' will never 
be executed [-Wunreachable-code-break] 418 | break; | ^~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:209:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 209 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:216:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 216 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:223:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 223 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:230:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 230 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:237:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 237 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:244:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 244 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:251:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 251 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 78 warnings generated when compiling for gfx1201. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float 
tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:258:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 258 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:265:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 265 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:272:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 272 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:279:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 279 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:286:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 286 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:293:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 293 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:300:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 300 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:307:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 307 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:314:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 314 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:321:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 321 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:328:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 328 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:176:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 176 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:179:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 179 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:182:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 182 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:185:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 185 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:188:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 188 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:191:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 191 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | 
~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:194:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 194 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:80:48: warning: suggest braces around initialization of subobject [-Wmissing-braces] 80 | float tmp[ncols_y][rows_per_cuda_block] = {0.0f}; | ^~~~ | { } /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:197:13: note: in instantiation of function template specialization 'mul_mat_vec_q' requested here 197 | mul_mat_vec_q<<>>(vx, vy, dst, ncols_x, nrows_x, nrows_y, nrows_dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:335:5: note: in instantiation of function template specialization 'mul_mat_vec_q_cuda' requested here 335 | mul_mat_vec_q_cuda(vx, vy, dst, ncols_x, nrows_x, nrows_y, ncols_y, nrows_dst, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/mmvq.cu:126:98: warning: comparison of integers of different signs: 'unsigned int' and 'const int' [-Wsign-compare] 126 | if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) { | ~~~~~~~~~~~~~~~~~~ ^ ~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are 
an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 293 warnings generated when compiling for host. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ [ 58%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 
& mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 78 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const 
int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | 
launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ :2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ launch_mul_mat_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ q(ctx, 
ar/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ gs, stream); /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 
'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ 
^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, 
const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void 
mma_K/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 8(const mma_int_A_I16K8 & mma_A, const mm/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ a_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mIn file included from at_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | 
launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, co/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ nst int & stride11, const int & ne0, /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 78 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int 
* __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, 
args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ if (it /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ != blockIdx.x || jt != /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hb:254:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ lockIdx.y) { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 78 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, 
const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | 
~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned 
int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhs:t2691r:36id:e 0warning: 1comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare], con 2691s | t i n t & nief1 0,( icot ns!t= bilntoc k&Id nxe1.1x, c|o|n sjtt i!nt= &bl sotcrkiIddxe.1y1), { c o| n ~~ ^ ~~~~~~~~~~s t i/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhn:t2813 &: 9ne: 0note: ,in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here | ^ 2813 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh : 2497 :75 : warning: munused parameter 'ne10' [-Wunused-parameter]ul _ma t2497_ | q _ s tcronesat mi_nkt_ fi& xnue0p0<,t ycpoen,s t minmt q_&x, nMMeQ0_1,N cWoAnRPstS ,i nente &d_ cshtecrki>d i>n>t &| ^ s 
tr/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhid:e28731:1,13 c:on stnote: iin instantiation of function template specialization 'launch_mul_mat_q' requested heren t 2873& | ne 0 , | ^ launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq1_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 78 warnings generated when compiling for gfx90a. 78 warnings generated when compiling for host. 
[ 59%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q2_k.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q2_k.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q2_k.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q2_k.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | 
launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != 
blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned 
int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdxIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ .y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, 
args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != bloIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ ckIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const 
int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_f/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhi:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ xup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 
'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 78 warnings generated when compiling for gfx942. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] 1022 | for (int k01 = 0; k01 < WARP_SIZE; k01 += QR2_K*VDR_Q2_K_Q8_1_MMQ) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are 
an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] 78 warnings generated when compiling for gfx90a. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an 
unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const 
mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int 
* __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be 
disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | 
^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | In file included from launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_str/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhe:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ am_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template 
specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt !=/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, 
const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 59%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q3_k.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q3_k.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q3_k.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q3_k.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 78 warnings generated when compiling for host. [ 60%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_0.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_0.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_0.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_0.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & 
mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 98 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, 
const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 61%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_1.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_1.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_1.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_1.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & 
mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. 
[ 62%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_k.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_k.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_k.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_k.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq3_s.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 63%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_0.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_0.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_0.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_0.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh):1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ ; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const 
mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 63%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_1.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_1.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_1.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_1.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu 78 warnings generated when compiling for gfx1012. 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const 
int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 254 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: 
unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of 
function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 
2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 78 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, 
const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y)In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: 
unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in 
instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if 
(it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) {78 warnings generated when compiling for gfx1030. 
| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != 
blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * _/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ _restrict__ sum, const int & k00) {/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if 
(it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ct/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ x, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: 
note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ype, 128>(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ launch_mul_mat_q(ctx, args,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: 
warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 
'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | 78 warnings generated when compiling for gfx1102. ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 78 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, 
const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 2894 | la/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ unch_mul_mat_q(ctx, args, stream/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ ); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h :281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 
'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 
'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh warning:s2691 generated: when compiling for 36gfx1100:. warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: 
unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in 
instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if 
(it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & 
ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 78 warnings generated when compiling for gfx900. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_In file included from 
q/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ (ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, 
args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' 
and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y)/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int 
& stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, 
stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | 
^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh::2691172::36105:: warning: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 2691 | 172 | i f ( i t_ _!d=e vibcleo_ck_I _d_xf.oxr c|e|i njlti n!e=_ _b lvoocikdI dmxm.ay_)K 4{( c o| n ~~ ^ ~~~~~~~~~~s t mma_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhi:n2813t:_9A_:I 1note: 6in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested hereK 4 & mma _2813A | , co n s t m mam_uiln_tm_aBt__Jq8_Ks4t r&e ammm_ak__Bf)i x{u p <| t ^y pe, mmq_x, MMQ_NWARPS, need_check><<> _>_f or c| ei ^n li/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhn:2873e:13_: _ note: voin instantiation of function template specialization 'launch_mul_mat_q' requested herei d m2873m | a_ K 8 ( co ns t m m a l_aiunntch_A__Im1u6Kl8_ m&a t_mqi(nct_tB_xJ8, Ka8rg s&, smmtar_eB)a m){; | ^| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template 
specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != 
blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | 866 ^ | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2879 :co13n:s tnote: in instantiation of function template specialization 'launch_mul_mat_q' requested here in t2879 | * _ _ r e s t ri ct _l_a xu,n cch_omnsult _imnatt_ q*< t__yrpeest,r i8ct0>_(c_tx , ya,r gfs,l sotareta m*); _ _ r| e ^s tri/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhc:t_2691:_16 :s uwarning: mcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare], co ns2691t | in t & k 0i0)f ({i t 
| ! ^= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const 
mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' 
requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != b/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ lockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x 
||/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ mul_mat_q(ctx, args, stream); /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | if (it != blockIdx.x || jt != /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 78 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: 
unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in 
instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if 
(it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx78 warnings generated when compiling for gfx1200. 
.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 64%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_k.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_k.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_k.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_k.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & 
mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 
& mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const 
mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ 
^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh| : ^2691 :36:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :warning: 2497:comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]75 : warning: unused parameter 'ne10' [-Wunused-parameter] 2691 | 2497 | icofn s(tit i n!t= &bl noeck00I,dx .coxn |s|t ijnt &t !ne=0 b1l, occkoInsdtx .iyn)t { & s| t ~~ ^ ~~~~~~~~~~r ide01/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh,: 2805c:o9:n st innote: tin instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here & ne10, 2805c | o n s t i n t m&u ln_em1a1t,_ qc_osntsrte aimn_tk _&f isxturpi<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const 
mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 78 warnings generated when compiling for gfx1201. 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const 
mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != 
blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & 
mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 78 warnings generated when compiling for gfx900. 78 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const 
mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, con/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ st int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ , const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 
'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 
'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ dims, 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) 
{ | ~~ ^ ~~~~~~~~~~ need_check><<' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ block_dims, 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, 
args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != block/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ Idx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of 
integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const 
int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of 
different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ _mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ MMQ_NWARPS, need_check><<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 2691 | if (it != blockIdx.x /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh|:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: 
,warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ : warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template 
specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != 
blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: 
unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in 
instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if 
(it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q3_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 65%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q6_k.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q6_k.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q6_k.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q6_k.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & 
mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const 
mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhK8:(2821c:o15:ns twarning: unused variable 'nsm' [-Wunused-variable]m ma_int _2821A | _ I 1 6 Kc8o n&s tm mian_tA ,n scmo n s t= mgmgam_li_nctu_dBa__Ji8nKf8o (&) .mdmeav_iBc)e s{[ i d| ] ^. 
nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<< > > | i ^f (it/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :!2867=: 13b:l onote: cin instantiation of function template specialization 'launch_mul_mat_q' requested herek Idx. x2867 | | | j t ! 
= b l olacukncIhd_mxu.ly_)m a{t _ q| < ~~ ^ ~~~~~~~~~~t ype, 48>(ctx,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2805a:r9gs:, snote: tin instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested herer eam) ;2805 | | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh: 2691m:u16:l _warning: mcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] at_ 2691q | _s t r e a mi_fk _(fiitxu p!<=ty bploec,kI dmxm.qx_ x|,| jMtM Q!_=N WbAlRoPcS,k Idnx.eye)d _{ c h| e ~~ ^ ~~~~~~~~~~ ck><<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<< >> | ^ i/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhf: 2867(:i13t: !note: =in instantiation of function template specialization 'launch_mul_mat_q' requested here bloc 
k2867I | d x . x | | j t ! =l abulnocchk_Imduxl._ym)a t{_ q <| t ~~ ^ ~~~~~~~~~~y pe, 4/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh8:>(2813c:t9x,: a rnote: gin instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested heres , st r2813e | am ) ; | ^ mu/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhl:_m2691a:16t:_ warning: qcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]_ st r2691 | ea m _ k _ f i x upif< (tity !pe=, mbmloqc_kIxd,x. xM |M|Q j_Nt W!A= RblPocSk,I dnexe.yd) _{c h e| ~~ ^ ~~~~~~~~~~c k><<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' 
requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh::362691:: 36warning: :comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | 2691 | i fi f( i(ti t! =! =b lbolcokIcdkxI.dxx .|x| |j|t j!t= !b=l obclkoIcdkxI.dyx). 
y{) {| ~~ ^ ~~~~~~~~~~ | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh::92813:: 9note: :in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 2813 | mu l_ mmatu_lq__msatrte_aqm__ks_tfrixeuapWit>i>l i ng| , ^ b/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhl:2873oc:13k:_ dnote: imin instantiation of function template specialization 'launch_mul_mat_q' requested heres , 02873, | s tr e a m >l>au>n c h| _ ^mu l_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhma:t2858_q:' requested here4> (ct x2858, | a rg s, s t re a m) ; | ^l au/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhn:c2691h:_16mu: lwarning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]_m at _2691q | < t yp e ,i f 2(i4t >!=(c tbx,lo ckarIdgsx,. 
x s|t|r jeta m!)= ;b lo ck| ^Id x./builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhy:)2691 {: 16 :| ~~ ^ ~~~~~~~~~~ warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an 
extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 66%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q8_0.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q8_0.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q8_0.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q8_0.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & 
mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous 
types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of 
integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x 
|| jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_1.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: 
unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 78 warnings generated when compiling for host. 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ [ 67%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 
-DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: 
warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | 
ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { 
| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, 
const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & strid/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhe:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' 
[-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | 
~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with 
attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, 
const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops 
const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: 
note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_1.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 78 warnings generated when compiling for gfx1103. 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for host. [ 68%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' 
requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1100. 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h0 :=192 :09;: warning: kanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]_ KQ_0 <192 | D / s i z eo f(sitnrut)c;t {k_ KQ| _ ^ 0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_fla/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hsh:_213a:t9t:n _warning: eanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]x t_ve c213_ | f 1 6 _ c a s e _sitmrpulc(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: 
anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. [ 68%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different 
signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 
'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int 
i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 
346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_at/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ tn_ext_vec_f16_case_impl' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ock, parallel_blocks, type_K, type_V, use_logit_softcap>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 
2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kern/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhe:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ l = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 142 | for (int i0 = 0; i0 < D//builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhs:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ izeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh<:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ D, parallel_blocks> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, 
stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | fo/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ r (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/si/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ zeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1031. 60 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x ||/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h j:t 213!:=9 :b lwarning: oanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]c kId x213 | . 
y ) { | ~~ ^ ~~~~~~~~~~ s tru/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhc:t2813 :9{: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here| ^ 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' 
requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1102. 60 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARIn file included from P/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ _SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1103. 60 warnings generated when compiling for gfx1030. 78 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an 
anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ , const mma_int_B_J8K4 & m/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 
'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ ma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const 
int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ lock, parallel_blocks, type_K, type_V, us/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ e_logit_softcap>(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ (int k_KQ_0 = 0; k_KQ_0 < 
D/sizeof(int/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ r_block, parallel_blocks, type_K, type_V/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ , use_logit_softcap>(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 196 | for (int k_KQ_0 = 0; k_KQ_0 /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ ock, parallel_blocks, type_K, type_V, use_logit_softcap>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ at_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 2867 | launch_mul_mat_q(ctx, args, streIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = 
flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ am); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function 
template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 
'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ _cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 
2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kerne/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ l = flash_attn_vec_ext_f16' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ _block, parallel_blocks, type_K, type_V, use_logit_softcap>; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_ma/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ t_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template 
specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl' requested here 2805 | mul_mat_q_stream_k_fixup<<(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ , 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x 
|| jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' 
requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function 
template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | 
launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 303 | fattn_kernel_t fattn_kernel = fl/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuha:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ sh_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of 
integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template 
specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 
'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1031. 60 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different 
signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 
'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < 
D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' 
[-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 
'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ p>; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ l_blocks, type_K, type_V, use_logit_softcap>(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeoIn file included from f/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ (int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, 
dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: 
warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | 
ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ 60 warnings generated when compiling for gfx1151. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | 
for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 
? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ 78 warnings generated when compiling for gfx1100. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template 
specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with 
attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, 
const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ 78 warnings generated when compiling for gfx1100. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | 
mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types 
declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: 
unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of 
function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 
2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 60 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' 
[-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1100. 60 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different 
signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 
'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 60 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < 
sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' 
requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 60 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared 
with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_qIn file included from _st/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cur:eam_k_f3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:ix21:u19:p <| 
< ^ ^> > /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh :| 25 ^: 19:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2852warning: :unused parameter 'ne10' [-Wunused-parameter]13 : 25note: | in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | co n s t i n tl anuen1c0h,_ m | u ^l _m/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhat:_28q:19<:t ywarning: peunused parameter 'ne13' [-Wunused-parameter] , 28 | 8 > ( c t x , caorgnss,t sitnrte anme)1;3 , | ^| ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh29::192691:: 16warning: :unused parameter 'ne31' [-Wunused-parameter] warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 29 | 2691 | c o n s t iifn t( inte 3!1=, b l| o ^c kI/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhd:x30.:x19 :| |warning: unused parameter 'nb31' [-Wunused-parameter]j t !30= | bl o c k I d x .cyo)n s{t i| n ~~ ^ ~~~~~~~~~~t nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 
39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhgg:m2691l:_36cu:d awarning: _comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]f lash _2691a | t t n _ ex t _ivfe c(_ift1 6!_=c absleo_cikmIpdlx<.Dx, c|o| ljst_ p!e=r _bblloocckkI, dpxa.rya)l {l e l| _ ~~ ^ ~~~~~~~~~~ blo/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhc:k2805s:9,: tnote: yin 
instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested herep e_K ,2805 | t yp e _ V , u smuel__lmoagti_tq_s_osfttrceaam_pk>_(ficxutpx >ZE> ) { | ^| ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 
'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 
128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1151. 60 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 
'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1103. 60 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ 60 warnings generated when compiling for gfx1200. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template 
specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different 
signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 
'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1201. 60 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = 
flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh warning: :comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]554 :24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 196 | 554 | f o r ( i n*t( (ku_iKQn_t03 =2 _0t ;* )k _&KKQQ_0 _' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused 
parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh= :fl116a:s37h:_ atwarning: tcomparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]n _vec_ext_f1 6116< | D , c o l s _ p e r _ b l o c kf,o rp a(rianltl eil0_ b=l o0c;k si,0 tE); { | | ~~ ^ ~~~~~~~~~~~~~ ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh13::303 :note: 35in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested 
here : note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | 303 | f a t tgng_mkle_rcnuedla__tf lfaastht_na_tktenr_neexlt _=v efcl_afs1h6__actatsne__viemcp_le(scotfxt,c apd>s;t ) ;| ^ | ^/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh :369:13/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:: note: 142in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here: 33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]369 | 142 | g g ml _ c ufdoar_ f(ilnats hi_0 a= t0t;n _eix0t _(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 
'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' 
requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh1;: 116l :<37 :s iwarning: zecomparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]o f(int); ++l) { 116 | | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh : 341 : 27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]f or 341 | (i nt i 0 = 0f;or (iin0t ' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhnote: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here: 129:33: warning: 306 | comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] launch_f a129tt | n t( cit0x ,= d0s;t ,i 0f a' requested here_V ); | ^ 303 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh : 381 : 9f:a tnote: tin instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested heren _kernel_ t381 | fa t t n _ k e rnel g=g mfll_acsuhd_aa_tftlna_svhe_ca_tetxnt__efx1t6__;l o g| i ^t _softc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuha:p333>:(13c:t xnote: ,in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here dst); | ^333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, 
dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1102. 60 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared 
with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int 
ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused 
parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function 
template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, 
GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with 
attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, 
const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 60 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: 
cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 
33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different 
signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 
'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for host. 
[ 69%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1151. 60 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f3219;: warning: | unused parameter 'ne00' [-Wunused-parameter] ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308: 1321: | note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here co n308s | t i n t n e 0 0 , g| g ^m l_cu/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhd:a24_:f19l:a swarning: hunused parameter 'ne03' [-Wunused-parameter]_ att n24_ | e x t _ v e c _ fc3o2n_scta sien_ti mpnle<0D3,, c o| l ^s _/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhp:e25r:_19b:l owarning: unused parameter 'ne10' [-Wunused-parameter]c k ,25 | p a r a l l e lc_obnlsotc kisn,t tnyep1e0_,K , | t ^y pe/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh_:V28,: 19u:s ewarning: _unused parameter 'ne13' [-Wunused-parameter]l og i28t | _ s o f t c a p >c(ocntsxt, idnstt )n;e 1 3| , ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' 
[-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == 
GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings generated when compiling for gfx1152. /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 
'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' 
[-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | 
~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different 
signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 
493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 
= 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:333:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 333 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:343:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 343 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:346:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 346 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:356:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 356 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:359:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:369:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 369 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:372:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 372 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:384:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 384 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx1031. 60 warnings generated when compiling for host. 
[ 70%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { In file included from | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ :116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuhwarning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ :116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1150. 34 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared 
with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const 
int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx906. 34 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 
'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | gIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 
0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ gml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 
481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIIn file included from Z/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = 
flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ E) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template 
specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 
0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template 
specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' 
and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' 
[-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx1101. 34 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' 
requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1100. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx1102. 78 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' 
requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx1200. 60 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared 
with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' 
requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q4_0, GGML_TYPE_Q4_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 60 warnings generated when compiling for host. 
[ 71%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: 
warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1150. 60 warnings generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' 
[-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1151. 34 warnings generated when compiling for gfx1010. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1200. 60 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In 
file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) 
{ | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' 
[-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused 
parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 
+= WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl (+c= tx,W AdsRtP)_;S I ZE| ) ^{ | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | 
fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 
+= WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZIn file included from 
E/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu): {3 : In file included from | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh ~~ ^ ~~~~~~~~~~~~~:2 : /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh65::28433::35 :warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 65 | 284 | f o rf a(titnnt_ kke_rKnQe_l0_ t= f0a;t tkn__KkQe_r0n e' requested herel ocks, 479t | yp e _ K ,r ettyupre_nV ,t yupsee__Kl o=g=i tG_GsMoLf_tTcYaPpE>_;Q 4 _| 0 ^ ? ve/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuhc:_334d:o13t:_ fnote: ain instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested heret tn_vec_ K334Q | _ q 4 _ 0 < h a l f , Dg>g m:l _ c| u ^d a_fl/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhas:h303_:a35t:t nnote: _in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here ext_ ve303c | _ f 32 _ cafsaet_timnp_lk_(pcetrx_, bdlsotc);k , | p ^a ral/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuhl:e129l:_33b:l owarning: ccomparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]k s, t129y | p e _ K , t yp e_ V, u sfeo_logrit (int_so iftc0 a=p 
>0;; i| 0 < ^ D/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:/330s:i13ze:o fnote: (in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested herei nt) ;330 | i0 + = W A R P _ SI Z Eg) g{m l _| c ~~ ^ ~~~~~~~~~~~~~ud a_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:f142la:s33h:_ awarning: tcomparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]t n_e x142 | t _ v e c _ f 1 6 _ c afsoe_ri m(pil(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function 
template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 
'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested 
here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx1200. 78 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different 
signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 
493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 34 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 78 warnings generated when compiling for gfx1152. 34 warnings generated when compiling for gfx1031. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | 
struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, c/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hon:st192 :in9t: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]* _ _192r | e s t ri c t __s tyr,u cft l{ oa| t ^* __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' 
[-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | 
__device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int 
& ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) 
{ | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const 
int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:196::269133::36 :warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 196 | 2691 | f o r ( iinft (ki_tK Q!_=0 b=l o0c;k Ikd_xK.Qx_ 0| |< jDt/ s!i=z ebolfo(ciknItd)x;. 
yk)_ K{Q _ 0| ~~ ^ ~~~~~~~~~~+ = WARP/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh_:S2805I:Z9E:) note: {in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here | ~~~~~~ ^ ~~~~~~~~~~~~~ 2805 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh : 482 : 36 : note: min instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested hereul _mat_ q482_ | s t r e a m _ k _tfyipxeu_pK< t=y=p eG,G MmmLq__TxY,PE _QM5M_Q1_NW A?R PvSe,c _nedeod_tc_hfeactkt>n<_b l:o ck _| d ^i ms/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh,: 303:350:, note: sin instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested heret ream >303> | > | fatt ^n _/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhk:e2873rne:l_13t: fnote: atin instantiation of function template specialization 'launch_mul_mat_q' requested heret n_k e2873r | n e l = f la s hl_aatutnnc_hve_cm_uel_xmta_ft1_6q<k(,c tpxa,r aalrlgesl,_ blsotcrkeasm,) ;t y p| e ^_ K,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :t2691y:p16e:_ Vwarning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare], u s2691e | _lo g i t _ s o f itfc a(pi>t !; = b| ^l oc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhk:I330d:x13.:x | |note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested herej t != 330 | b loc k Id x . 
y )g g{m l _| cu ~~ ^ ~~~~~~~~~~d a_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 
'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_v/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhe:c_2691K:36Q: _warning: qcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]4 _0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhi:f303 :(35i:t note: !in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here= b loc kI303d | x . x |f|a jttt n!_=k ebrlneolc_ktI dfxa.tyt)n _k{e rn | ~~ ^ ~~~~~~~~~~e l =/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :f2805:l9a: note: sin instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested hereh _at t2805n | _v e c _ e xmtu_lf1_6m_y;_ t i| l ^i ng/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh,: 330b:l13oc:k _note: din instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested herei ms, 3300 | , s t re a m > > > g| g ^m l_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhc:2876u:d13a:_ note: fin instantiation of function template specialization 'launch_mul_mat_q' requested herel a s2876h | _ a t t n _ e x t _ v elca_fu1n6c_cahs_em_uilm_pmlap(ecrt_xb,l oarcgk,s , sptarreaalm);l e l| _ ^b locks,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2691t:yp16e:_ warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]K, typ e2691_ | V, u s e _ l o giit_sofft c(aip>t( c!t=x, bldoscktI)dx.;x || | ^j t != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh3:: 2813In file included from :/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh9::2 : note: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhin instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here: 318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]2813 | 318m | u l _ m afto_rq _(sitnrte alm _=k _0f;i xlu p<< tsyipzee,o fm(miqn_tx, MM)Q;_ NW+A+RlP)S {, n ee| d_ ~ ^ ~~~~~~~~~~~c hec/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhk:>130<:<<17:b lonote: cin instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested herek _num s_130 | x y_ t il i ng , b l oc k _di mqusa, n0t,i zset_rqe8_a1m_>t>o>_ sha r| e ^d note: (in instantiation of function template specialization 'launch_mul_mat_q' requested here Q_ f 2876+ | 4 * i 0 , sc a llaeu, tmncph__qm_uli_3ma2,t _tqm| ( ^c tx,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh :a303r:g35s,: note: sin instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested heret rea 303 | m ) ; f| a ^t 
tn/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh_:ke2691r:n16: ewarning: lcomparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]_ t f2691a | t t n _ k e rinfel (=i tf l!a=sh _bloactktInd_xv.exc _|ext_f|1 6j; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of 
integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x 
|| jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' 
requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: 
warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx1201. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' 
[-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 78 warnings generated when compiling for gfx900. 34 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx1101. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args,/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h :192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ if (it != blockIdx./builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ x || jt != bl/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.ho:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ ckIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation 
of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K =/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h= :G192G:M9L:_ Twarning: Yanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]P E_Q4 _1920 | ? v e c _ d ots_trfuacttt n{_ v e| c_KQ ^ _q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst)/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h;: 213: 9| : ^ warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0;/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h l: 281<: 9s:i zwarning: eanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]o f(in t281) | ; + + l ) { s t| r ~ ^ ~~~~~~~~~~~u ct { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh| : ^130 :17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cud/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.ha:_f298l:a9s:h _warning: aanonymous types declared in an anonymous union are an extension [-Wnested-anon-types]t tn _298e | xt _ v e c _ f1 6str_uccatse _{i m p| l ^ (ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 
'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int 
ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused 
parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 60 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 128>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 128>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 128>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 128>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 128>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for host. [ 72%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu.o -MF 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu 34 warnings generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | 
flash_attn_combine_re/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hsu:l192t:s9<:D ,warning: panonymous types declared in an anonymous union are an extension [-Wnested-anon-types]a rall e192l | _b l oc k s > | ^s tr/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhu:c306t: {5 :| note: ^in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings generated 
when compiling for gfx906. 34 warnings generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 
'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ 
~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < 
D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1012. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings generated 
when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx1150. 34 warnings generated when compiling for gfx1030. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings generated 
when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx1031. 60 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: 
warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1151. 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison 
of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 
'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * 
__restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template 
specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx1200. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx1035. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 60 warnings generated 
when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 
< D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:311:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 311 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | 
for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:321:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 321 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:324:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 2, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, 
true>' requested here 324 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:334:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 334 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:337:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 4, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 337 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:347:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 347 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:350:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 4, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 350 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 
'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:116:37: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 116 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:362:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_Q8_0, GGML_TYPE_Q8_0, true>' requested here 362 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:129:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 129 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:142:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 142 | for (int i0 = 0; i0 < D/sizeof(int); i0 += WARP_SIZE) { | ~~ ^ ~~~~~~~~~~~~~ 34 warnings generated when compiling for gfx1152. 60 warnings generated when compiling for host. 
[ 72%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu.o.d -o 
CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu 34 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension 
[-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx90a. 34 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared 
with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<</builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ >> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh :563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x ||In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ , mmq_x, MMQ_NWARPS, need_check><<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested 
here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' 
requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings generated when compiling for gfx908. 34 warnings generated when compiling for gfx1102. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | strIn file included from uc/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cut: 3{: In file included from | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh ^: 1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h s:t254r:9u: cwarning: t anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]{ | 254 ^ | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct {/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h : | 281 ^: 9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h | : 298 : 9 : warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]s tr u298c | t { | ^ s truct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; 
l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = 
ggml_cuda_info().devices[id].nsm; | ^~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 
'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | 
mul_mat_q_stream_k_fixup/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu<:<3<: bIn file included from l/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuho:c2k: _/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhn:u149m:s33_:x ywarning: _comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]t iling, bl o149c | k _ d i mfso,r 0(,i nstt rke_aKmQ>_>0> = | 0 ^; k_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhK:Q2864_:013 :< note: Din instantiation of function template specialization 'launch_mul_mat_q' requested here/ size o2864f | ( i n t ) ; k _ K Q _ 0l a+u=n cWhAR_mPu_SlI_ZmEa)t {_q < | t ~~~~~~ ^ ~~~~~~~~~~~~~y pe/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh,: 481 :436:0 >(note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested herec tx, 481a | r g s, s tr e a mty);p e_ K| ^= = GG/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhM:L2691_:16TY:P Ewarning: _comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare]Q 5_0 2691? | v ec _ d o tif_ fa(titt n!_=v ebcl_oKcQ_kqI5d_x0. 
!=: bl o| c ^ kId/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhx.:y303): 35{ : note: | in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here ~~ ^ ~~~~~~~~~~ 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int 
k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of 
function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) 
&KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' 
[-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated when compiling for gfx1201. 34 warnings generated when compiling for gfx1103. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 
'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx90a. 34 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhanonymous types declared in an anonymous union are an extension [-Wnested-anon-types] :2691:36: warning: 171comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] | 2691 | s tr uicft ({i t | ! ^= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q254(:c9t:x ,warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]a rgs, 254s | t r e a m ) ; st r| u ^c t { /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh :2691| : ^16 : warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: 
comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it 
!= blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation 
of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings generated 
when compiling for gfx1201. 34 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared 
with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' 
[-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const 
int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template 
specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it !=In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fIn file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ ixup<<>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of 
different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ ck_nums_xy_tiling, block_dims, 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockI/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template 
specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ dx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in 
instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | 
flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of 
different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | 
launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx1152. 34 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: 
function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1031. 78 warnings generated when compiling for gfx90a. 34 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' 
[-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct 
{ | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' 
[-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx900. 34 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: In file included from anonymous types declared in an anonymous union are an extension [-Wnested-anon-types]/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ 213 | st/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 
| struct { | ^ ruct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 
'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for 
(int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ block_dims, 0, stream>>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: In file included from warning: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' 
requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in 
instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ mul_mat_q_stream_k_fixup' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ need_check><<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 
'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx1101. 34 warnings generated when compiling for gfx90a. 34 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(c/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhtx:, 554ds:t24,: fwarning: acast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual]tt n_kerne l554, | nw a rp s , c o*l(s(_upienrt_3b2l_octk ,* )ne ed&_KfQ1_6_maKx_,sc anleee)d _&f1= 6f_tVz);_ m| ^a sk/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh;: 330 :| 13 ^ : note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | 
^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 256>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 256>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 256>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 256>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_comIn file included from bi/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cun:e3_: rIn file included from e/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhsu:l2t: 
s/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh<:D65,:33 :p awarning: rcomparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare]a llel_block s65> | | ^ fo/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuhr: 306(:i5n:t note: kin instantiation of function template specialization 'launch_fattn<64, 1>' requested here_KQ _0 = 0306 | ; k _ KQl_a0u n( ctWx, AdRPs_SIZtE,) f{a t t| n ~~~~~~ ^ ~~~~~~~~~~~~~_ kern/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuhe:l479, :n39w:a rnote: pin instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 256>' requested heres , cols_pe r479_ | b l o rcekt,u rnne edt_ypfe1_6K_ K=,= nGeGeMdL__TfY16P_EV_)Q;4 _| 0 ^ ? vec/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:_381d:o9t:_ fnote: atin instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested heretn _vec 381_ | K Q _ q 4 _ 0 < hgaglmfl,_c udD>a _:f l a| s ^h _a/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuht:t303n:_35e:x tnote: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here_ vec _303f | 1 6 _ c afsaet_tinm_pklec(kcst,x ,t dyspte)_;K ,| ^ type_V, use_logit_softcap>; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | 
ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ 34 warnings generated when compiling for host. [ 73%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ 
~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' 
[-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ 78 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q8_0.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx1102. 78 warnings generated when compiling for host. [ 74%] Building CXX object ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/hipcc -DGGML_BACKEND_BUILD -DGGML_BACKEND_SHARED -DGGML_HIP_NO_VMM -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_HIP -DUSE_PROF_API=1 -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -D__HIP_PLATFORM_AMD__=1 -Dggml_hip_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/.. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 -MD -MT ggml/src/ggml-hip/CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu.o -MF CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu.o.d -o CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ 
~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' 
[-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx942. 34 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: 
warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:25:19: warning: 
unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:483:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0<__half, 64>' requested here 483 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:482:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1<__half, 64>' requested here 482 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:481:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0<__half, 64>' requested here 481 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:480:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1<__half, 64>' requested here 480 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:479:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0<__half, 64>' requested here 479 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared<__half2>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:303:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f16<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 303 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f16; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:330:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 330 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:306:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 306 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f16.cuh:381:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f16_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 381 | ggml_cuda_flash_attn_ext_vec_f16_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: 
unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for host. 34 warnings generated when compiling for gfx1010. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx906. 34 warnings generated when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); 
++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < 
D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1012. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1031. 34 warnings generated when compiling for gfx1030. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' 
[-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(icztx,e dosft();i n t| ) ^; ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included 
from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1035. 34 warnings generated when compiling for gfx1151. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx1201. 34 warnings generated when compiling for gfx1031. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ launch_mul_/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.hm:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ at_q(ctx/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h,:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :254:9: 
warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuhstruct { | ^ :2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ :281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < 
D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings generated 
when compiling for gfx908. 34 warnings generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared 
with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & 
ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: 
warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ 
~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1101. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1035. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1100. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] 1022 | for (int k01 = 0; k01 < WARP_SIZE; k01 += QR2_K*VDR_Q2_K_Q8_1_MMQ) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested 
transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: 
warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1022:5: warning: loop not unrolled: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering [-Wpass-failed=transform-warning] 34 warnings generated when compiling for gfx1150. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1201. 78 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison 
of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 
'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q5_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. 34 warnings generated when compiling for gfx1101. 34 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: 
comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused 
parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings generated 
when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx900. 34 warnings generated when compiling for gfx1152. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1102. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1103. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx900. 34 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: 
unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx1150. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __fo34r warnings generated when compiling for gfx908. ceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const 
int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x 
|| jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); 
++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < 
D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx1151. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx90a. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1152. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ 34 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 
'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 4>' requested here 
287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<64, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<64, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<64, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings generated 
when compiling for host. 98 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<128, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<128, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<128, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for host. 34 warnings generated when compiling for gfx1200. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file 
included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx1201. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx900. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx942. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q6_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. 34 warnings generated when compiling for gfx906. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx900. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 78 warnings 
generated when compiling for gfx906. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 34 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:1: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:563:47: warning: function 'on_no_fattn_vec_case' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 563 | static void on_no_fattn_vec_case(const int D) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:21:19: warning: unused parameter 'ne00' [-Wunused-parameter] 21 | const int ne00, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:24:19: warning: unused parameter 'ne03' [-Wunused-parameter] 24 | const int ne03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:25:19: warning: unused parameter 'ne10' [-Wunused-parameter] 25 | const int ne10, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:28:19: warning: unused parameter 'ne13' [-Wunused-parameter] 28 | const int ne13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:29:19: warning: unused parameter 'ne31' [-Wunused-parameter] 29 | const int ne31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:30:19: warning: unused parameter 'nb31' [-Wunused-parameter] 30 | const int nb31, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:33:19: warning: unused parameter 'nb03' [-Wunused-parameter] 33 | const int nb03, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:36:19: warning: unused parameter 'nb13' [-Wunused-parameter] 36 | const int nb13, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:39:19: warning: unused parameter 'nb23' [-Wunused-parameter] 39 | const int nb23, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:40:19: warning: unused parameter 'ne0' [-Wunused-parameter] 40 | const int ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:41:19: warning: unused parameter 
'ne1' [-Wunused-parameter] 41 | const int ne1, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:42:19: warning: unused parameter 'ne2' [-Wunused-parameter] 42 | const int ne2, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:43:19: warning: unused parameter 'ne3' [-Wunused-parameter] 43 | const int ne3) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:247:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 247 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:494:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q8_0' requested here 494 | type_K == GGML_TYPE_Q8_0 ? 
vec_dot_fattn_vec_KQ_q8_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:196:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 196 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:493:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_1' requested here 493 | type_K == GGML_TYPE_Q5_1 ? 
vec_dot_fattn_vec_KQ_q5_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:149:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 149 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:492:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q5_0' requested here 492 | type_K == GGML_TYPE_Q5_0 ? 
vec_dot_fattn_vec_KQ_q5_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:105:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 105 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:491:36: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_1' requested here 491 | type_K == GGML_TYPE_Q4_1 ? 
vec_dot_fattn_vec_KQ_q4_1 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:65:33: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 65 | for (int k_KQ_0 = 0; k_KQ_0 < D/sizeof(int); k_KQ_0 += WARP_SIZE) { | ~~~~~~ ^ ~~~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:490:39: note: in instantiation of function template specialization 'vec_dot_fattn_vec_KQ_q4_0' requested here 490 | return type_K == GGML_TYPE_Q4_0 ? 
vec_dot_fattn_vec_KQ_q4_0 : | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:318:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 318 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:130:17: note: in instantiation of function template specialization 'quantize_q8_1_to_shared>' requested here 130 | quantize_q8_1_to_shared(Q_f + 4*i0, scale, tmp_q_i32, tmp_q_ds); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:284:35: note: in instantiation of function template specialization 'flash_attn_vec_ext_f32<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 284 | fattn_kernel_t fattn_kernel = flash_attn_vec_ext_f32; | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:325:23: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 325 | for (int l = 1; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:341:27: warning: comparison of integers of different signs: 'int' and 'unsigned long' [-Wsign-compare] 341 | for (int l = 0; l < sizeof(int); ++l) { | ~ ^ ~~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 4>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 4>' requested 
here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:308:13: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 1, 4, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 308 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:2: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:554:24: warning: cast from 'const float *' to 'unsigned int *' drops const qualifier [-Wcast-qual] 554 | *((uint32_t *) &KQ_max_scale) &= ftz_mask; | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-common.cuh:704:5: note: in instantiation of function template specialization 'flash_attn_combine_results<256, 1>' requested here 704 | flash_attn_combine_results | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:287:5: note: in instantiation of function template specialization 'launch_fattn<256, 1>' requested here 287 | launch_fattn(ctx, dst, fattn_kernel, nwarps, cols_per_block, need_f16_K, need_f16_V); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../fattn-vec-f32.cuh:359:9: note: in instantiation of function template specialization 'ggml_cuda_flash_attn_ext_vec_f32_case_impl<256, 8, 1, GGML_TYPE_F16, GGML_TYPE_F16, false>' requested here 359 | ggml_cuda_flash_attn_ext_vec_f32_case_impl(ctx, dst); | ^ 34 warnings 
generated when compiling for host. 78 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & 
ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx908. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx90a. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q4_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. 78 warnings generated when compiling for gfx942. 
In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../common.cuh:20: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:171:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 171 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:192:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 192 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:213:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 213 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:254:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 254 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:281:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 281 | struct { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-hip/../ggml-common.h:298:9: warning: anonymous types declared in an anonymous union are an extension [-Wnested-anon-types] 298 | struct { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:5: 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:172:105: warning: function 'mma_K4' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 172 | __device__ __forceinline__ void mma_K4(const mma_int_A_I16K4 & mma_A, const mma_int_B_J8K4 & mma_B) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mma.cuh:194:105: warning: function 'mma_K8' could be declared with attribute 'noreturn' [-Wmissing-noreturn] 194 | __device__ __forceinline__ void mma_K8(const mma_int_A_I16K8 & mma_A, const mma_int_B_J8K8 & mma_B) { | ^ In file included from /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/mmq-instance-q2_k.cu:3: /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:866:99: warning: unused parameter 'k00' [-Wunused-parameter] 866 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1053:99: warning: unused parameter 'k00' [-Wunused-parameter] 1053 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:1704:99: warning: unused parameter 'k00' [-Wunused-parameter] 1704 | const int * __restrict__ x, const int * __restrict__ y, float * __restrict__ sum, const int & k00) { | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:17: warning: unused parameter 'ne00' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2497:75: warning: unused parameter 'ne10' [-Wunused-parameter] 2497 | const int & ne00, const int & ne01, const int & stride01, const int & ne10, const int & ne11, const int & stride11, const int & ne0, | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2821:15: warning: unused variable 'nsm' [-Wunused-variable] 2821 | const int nsm = ggml_cuda_info().devices[id].nsm; | ^~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2852:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2852 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2855:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2855 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2858:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2858 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2861:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2861 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2864:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2864 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2867:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2867 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2870:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2870 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2873:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2873 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2876:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2876 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2879:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2879 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2882:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2882 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2885:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2885 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2888:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2888 | launch_mul_mat_q(ctx, args, stream); | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2891:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2891 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2894:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2894 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2805:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2805 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:36: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2813:9: note: in instantiation of function template specialization 'mul_mat_q_stream_k_fixup' requested here 2813 | mul_mat_q_stream_k_fixup<<>> | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2897:13: note: in instantiation of function template specialization 'launch_mul_mat_q' requested here 2897 | launch_mul_mat_q(ctx, args, stream); | ^ /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-cuda/template-instances/../mmq.cuh:2691:16: warning: comparison of integers of different signs: 'const int' and 'unsigned int' [-Wsign-compare] 2691 | if (it != blockIdx.x || jt != blockIdx.y) { | ~~ ^ ~~~~~~~~~~ 78 warnings generated when compiling for host. 
[ 75%] Linking CXX shared library ../../../bin/libggml-hip.so cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/cmake -E cmake_link_script CMakeFiles/ggml-hip.dir/link.txt --verbose=1 /usr/bin/hipcc -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -Xlinker --dependency-file=CMakeFiles/ggml-hip.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,libggml-hip.so.b4580 -o ../../../bin/libggml-hip.so.b4580 "CMakeFiles/ggml-hip.dir/__/ggml-cuda/acc.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/arange.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/argmax.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/argsort.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/binbcast.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/clamp.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/concat.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/conv-transpose-1d.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/convert.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/count-equal.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/cpy.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/cross-entropy-loss.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/diagmask.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f16.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn-tile-f32.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/fattn.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/getrows.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/ggml-cuda.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/gla.cu.o" 
"CMakeFiles/ggml-hip.dir/__/ggml-cuda/im2col.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmq.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmv.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/mmvq.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/norm.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/opt-step-adamw.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/out-prod.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/pad.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/pool2d.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/quantize.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/rope.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/scale.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/softmax.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/sum.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/sumrows.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/tsembd.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/unary.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/upscale.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/wkv6.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb16.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqfloat-cpb32.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb16.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb32.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-wmma-f16-instance-kqhalf-cpb8.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq1_s.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_s.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xs.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq2_xxs.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_s.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq3_xxs.cu.o" 
"CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_nl.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-iq4_xs.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q2_k.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q3_k.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-iclang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] nstance-q4_0.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_1.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q4_k.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_0.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_1.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q5_k.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q6_k.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/mmq-instance-q8_0.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q4_0-q4_0.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q4_0-q4_0.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-q8_0-q8_0.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-q8_0-q8_0.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs128-f16-f16.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs256-f16-f16.cu.o" 
"CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f16-instance-hs64-f16-f16.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs128-f16-f16.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs256-f16-f16.cu.o" "CMakeFiles/ggml-hip.dir/__/ggml-cuda/template-instances/fattn-vec-f32-instance-hs64-f16-f16.cu.o" ../../../bin/libggml-base.so.b4580 /usr/lib64/libhipblas.so.2.4 --hip-link --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 --offload-arch=gfx1010 --offload-arch=gfx1012 --offload-arch=gfx1030 --offload-arch=gfx1031 --offload-arch=gfx1035 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 --offload-arch=gfx1103 --offload-arch=gfx1150 --offload-arch=gfx1151 --offload-arch=gfx1152 --offload-arch=gfx1200 --offload-arch=gfx1201 /usr/lib64/librocblas.so.4.4 /usr/lib64/libamdhip64.so.6.4.43483 cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/ggml-hip && /usr/bin/cmake -E cmake_symlink_library ../../../bin/libggml-hip.so.b4580 ../../../bin/libggml-hip.so.b4580 ../../../bin/libggml-hip.so gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 75%] Built target ggml-hip /usr/bin/gmake -f ggml/src/CMakeFiles/ggml.dir/build.make ggml/src/CMakeFiles/ggml.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src/CMakeFiles/ggml.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f ggml/src/CMakeFiles/ggml.dir/build.make ggml/src/CMakeFiles/ggml.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 75%] Building CXX object ggml/src/CMakeFiles/ggml.dir/ggml-backend-reg.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_BUILD -DGGML_SCHED_MAX_COPIES=4 -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -D_GNU_SOURCE -D_XOPEN_SOURCE=600 -Dggml_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -std=gnu++17 -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT ggml/src/CMakeFiles/ggml.dir/ggml-backend-reg.cpp.o -MF CMakeFiles/ggml.dir/ggml-backend-reg.cpp.o.d -o CMakeFiles/ggml.dir/ggml-backend-reg.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/ggml-backend-reg.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 76%] Linking CXX shared library ../../bin/libggml.so cd 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/cmake -E cmake_link_script CMakeFiles/ggml.dir/link.txt --verbose=1 sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory clang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] /usr/bin/hipcc -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -Xlinker --dependency-file=CMakeFiles/ggml.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,libggml.so.b4580 -o ../../bin/libggml.so.b4580 "CMakeFiles/ggml.dir/ggml-backend-reg.cpp.o" -ldl ../../bin/libggml-cpu.so.b4580 ../../bin/libggml-hip.so.b4580 ../../bin/libggml-base.so.b4580 cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/ggml/src && /usr/bin/cmake -E cmake_symlink_library ../../bin/libggml.so.b4580 ../../bin/libggml.so.b4580 ../../bin/libggml.so gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 76%] Built target ggml /usr/bin/gmake -f src/CMakeFiles/llama.dir/build.make src/CMakeFiles/llama.dir/depend gmake[2]: Entering directory 
'/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src/CMakeFiles/llama.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f src/CMakeFiles/llama.dir/build.make src/CMakeFiles/llama.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 78%] Building CXX object src/CMakeFiles/llama.dir/llama.cpp.o [ 78%] Building CXX object src/CMakeFiles/llama.dir/llama-batch.cpp.o [ 79%] Building CXX object src/CMakeFiles/llama.dir/llama-context.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-batch.cpp.o -MF CMakeFiles/llama.dir/llama-batch.cpp.o.d -o CMakeFiles/llama.dir/llama-batch.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-batch.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama.cpp.o -MF CMakeFiles/llama.dir/llama.cpp.o.d -o CMakeFiles/llama.dir/llama.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-context.cpp.o -MF CMakeFiles/llama.dir/llama-context.cpp.o.d -o CMakeFiles/llama.dir/llama-context.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-context.cpp [ 80%] Building CXX object src/CMakeFiles/llama.dir/llama-adapter.cpp.o [ 80%] Building CXX object src/CMakeFiles/llama.dir/llama-hparams.cpp.o [ 81%] Building CXX object src/CMakeFiles/llama.dir/llama-grammar.cpp.o [ 81%] Building CXX object src/CMakeFiles/llama.dir/llama-arch.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-adapter.cpp.o -MF CMakeFiles/llama.dir/llama-adapter.cpp.o.d -o CMakeFiles/llama.dir/llama-adapter.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-adapter.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-hparams.cpp.o -MF CMakeFiles/llama.dir/llama-hparams.cpp.o.d -o CMakeFiles/llama.dir/llama-hparams.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-hparams.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-arch.cpp.o -MF CMakeFiles/llama.dir/llama-arch.cpp.o.d -o CMakeFiles/llama.dir/llama-arch.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-arch.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-grammar.cpp.o -MF CMakeFiles/llama.dir/llama-grammar.cpp.o.d -o CMakeFiles/llama.dir/llama-grammar.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-grammar.cpp [ 82%] Building CXX object src/CMakeFiles/llama.dir/llama-chat.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-chat.cpp.o -MF CMakeFiles/llama.dir/llama-chat.cpp.o.d -o CMakeFiles/llama.dir/llama-chat.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-chat.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 83%] Building CXX object src/CMakeFiles/llama.dir/llama-impl.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-impl.cpp.o -MF CMakeFiles/llama.dir/llama-impl.cpp.o.d -o CMakeFiles/llama.dir/llama-impl.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-impl.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 84%] Building CXX object src/CMakeFiles/llama.dir/llama-kv-cache.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-kv-cache.cpp.o -MF CMakeFiles/llama.dir/llama-kv-cache.cpp.o.d -o CMakeFiles/llama.dir/llama-kv-cache.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-kv-cache.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 85%] Building CXX object src/CMakeFiles/llama.dir/llama-mmap.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-mmap.cpp.o -MF CMakeFiles/llama.dir/llama-mmap.cpp.o.d -o CMakeFiles/llama.dir/llama-mmap.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-mmap.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 86%] Building CXX object src/CMakeFiles/llama.dir/llama-model-loader.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-model-loader.cpp.o -MF CMakeFiles/llama.dir/llama-model-loader.cpp.o.d -o CMakeFiles/llama.dir/llama-model-loader.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-model-loader.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 87%] Building CXX object src/CMakeFiles/llama.dir/llama-model.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-model.cpp.o -MF CMakeFiles/llama.dir/llama-model.cpp.o.d -o CMakeFiles/llama.dir/llama-model.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-model.cpp [ 87%] Building CXX object src/CMakeFiles/llama.dir/llama-quant.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-quant.cpp.o -MF CMakeFiles/llama.dir/llama-quant.cpp.o.d -o CMakeFiles/llama.dir/llama-quant.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-quant.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 88%] Building CXX object src/CMakeFiles/llama.dir/llama-sampling.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-sampling.cpp.o -MF CMakeFiles/llama.dir/llama-sampling.cpp.o.d -o CMakeFiles/llama.dir/llama-sampling.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-sampling.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 89%] Building CXX object src/CMakeFiles/llama.dir/llama-vocab.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/llama-vocab.cpp.o -MF CMakeFiles/llama.dir/llama-vocab.cpp.o.d -o CMakeFiles/llama.dir/llama-vocab.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/llama-vocab.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 90%] Building CXX object src/CMakeFiles/llama.dir/unicode.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/unicode.cpp.o -MF CMakeFiles/llama.dir/unicode.cpp.o.d -o CMakeFiles/llama.dir/unicode.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/unicode.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 91%] Building CXX object src/CMakeFiles/llama.dir/unicode-data.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_BUILD -DLLAMA_SHARED -Dllama_EXPORTS -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT src/CMakeFiles/llama.dir/unicode-data.cpp.o -MF CMakeFiles/llama.dir/unicode-data.cpp.o.d -o CMakeFiles/llama.dir/unicode-data.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/unicode-data.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [ 92%] Linking CXX shared library ../bin/libllama.so cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/cmake -E cmake_link_script CMakeFiles/llama.dir/link.txt --verbose=1 sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory clang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] /usr/bin/hipcc -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS 
--config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -Xlinker --dependency-file=CMakeFiles/llama.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,libllama.so.b4580 -o ../bin/libllama.so.b4580 CMakeFiles/llama.dir/llama.cpp.o "CMakeFiles/llama.dir/llama-adapter.cpp.o" "CMakeFiles/llama.dir/llama-arch.cpp.o" "CMakeFiles/llama.dir/llama-batch.cpp.o" "CMakeFiles/llama.dir/llama-chat.cpp.o" "CMakeFiles/llama.dir/llama-context.cpp.o" "CMakeFiles/llama.dir/llama-grammar.cpp.o" "CMakeFiles/llama.dir/llama-hparams.cpp.o" "CMakeFiles/llama.dir/llama-impl.cpp.o" "CMakeFiles/llama.dir/llama-kv-cache.cpp.o" "CMakeFiles/llama.dir/llama-mmap.cpp.o" "CMakeFiles/llama.dir/llama-model-loader.cpp.o" "CMakeFiles/llama.dir/llama-model.cpp.o" "CMakeFiles/llama.dir/llama-quant.cpp.o" "CMakeFiles/llama.dir/llama-sampling.cpp.o" "CMakeFiles/llama.dir/llama-vocab.cpp.o" CMakeFiles/llama.dir/unicode.cpp.o "CMakeFiles/llama.dir/unicode-data.cpp.o" ../bin/libggml.so.b4580 ../bin/libggml-cpu.so.b4580 ../bin/libggml-hip.so.b4580 ../bin/libggml-base.so.b4580 cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/src && /usr/bin/cmake -E cmake_symlink_library ../bin/libllama.so.b4580 ../bin/libllama.so.b4580 ../bin/libllama.so gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 92%] Built target llama /usr/bin/gmake -f common/CMakeFiles/common.dir/build.make common/CMakeFiles/common.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' cd 
/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common/CMakeFiles/common.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/gmake -f common/CMakeFiles/common.dir/build.make common/CMakeFiles/common.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [ 93%] Building CXX object common/CMakeFiles/common.dir/arg.cpp.o [ 95%] Building CXX object common/CMakeFiles/common.dir/common.cpp.o [ 95%] Building CXX object common/CMakeFiles/common.dir/sampling.cpp.o [ 97%] Building CXX object common/CMakeFiles/common.dir/console.cpp.o [ 97%] Building CXX object common/CMakeFiles/common.dir/log.cpp.o [ 97%] Building CXX object common/CMakeFiles/common.dir/json-schema-to-grammar.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/arg.cpp.o -MF CMakeFiles/common.dir/arg.cpp.o.d -o CMakeFiles/common.dir/arg.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/arg.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/common.cpp.o -MF CMakeFiles/common.dir/common.cpp.o.d -o CMakeFiles/common.dir/common.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/common.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/console.cpp.o -MF CMakeFiles/common.dir/console.cpp.o.d -o CMakeFiles/common.dir/console.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/console.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/json-schema-to-grammar.cpp.o -MF CMakeFiles/common.dir/json-schema-to-grammar.cpp.o.d -o CMakeFiles/common.dir/json-schema-to-grammar.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/json-schema-to-grammar.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/log.cpp.o -MF CMakeFiles/common.dir/log.cpp.o.d -o CMakeFiles/common.dir/log.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/log.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/sampling.cpp.o -MF CMakeFiles/common.dir/sampling.cpp.o.d -o CMakeFiles/common.dir/sampling.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/sampling.cpp [ 98%] Building CXX object common/CMakeFiles/common.dir/ngram-cache.cpp.o [ 99%] Building CXX object common/CMakeFiles/common.dir/speculative.cpp.o cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/speculative.cpp.o -MF CMakeFiles/common.dir/speculative.cpp.o.d -o CMakeFiles/common.dir/speculative.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/speculative.cpp cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/hipcc -DGGML_BACKEND_SHARED -DGGML_SHARED -DGGML_USE_CPU -DGGML_USE_CUDA -DGGML_USE_HIP -DLLAMA_SHARED -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/. -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/. 
-I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../include -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/src/../common -I/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/ggml/src/../include -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -DNDEBUG -fPIC -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wunreachable-code-break -Wunreachable-code-return -Wmissing-prototypes -Wextra-semi -MD -MT common/CMakeFiles/common.dir/ngram-cache.cpp.o -MF CMakeFiles/common.dir/ngram-cache.cpp.o.d -o CMakeFiles/common.dir/ngram-cache.cpp.o -c /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/common/ngram-cache.cpp sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory [100%] Linking CXX static library libcommon.a cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/cmake -P CMakeFiles/common.dir/cmake_clean_target.cmake cd /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/common && /usr/bin/cmake -E cmake_link_script 
CMakeFiles/common.dir/link.txt --verbose=1 bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record bfd plugin: LLVM gold plugin has failed to create LTO module: Invalid record /usr/bin/ar qc libcommon.a CMakeFiles/common.dir/arg.cpp.o CMakeFiles/common.dir/common.cpp.o CMakeFiles/common.dir/console.cpp.o "CMakeFiles/common.dir/json-schema-to-grammar.cpp.o" CMakeFiles/common.dir/log.cpp.o "CMakeFiles/common.dir/ngram-cache.cpp.o" CMakeFiles/common.dir/sampling.cpp.o CMakeFiles/common.dir/speculative.cpp.o "CMakeFiles/build_info.dir/build-info.cpp.o" /usr/bin/ranlib libcommon.a gmake[2]: Leaving directory '/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' [100%] Built target common gmake[1]: Leaving directory 
'/builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build' /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/redhat-linux-build/CMakeFiles 0 + RPM_EC=0 ++ jobs -p + exit 0 Executing(%install): /bin/sh -e /var/tmp/rpm-tmp.rrH0PB + umask 022 + cd /builddir/build/BUILD/llama-cpp-b4580-build + '[' /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT '!=' / ']' + rm -rf /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT ++ dirname /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT + mkdir -p /builddir/build/BUILD/llama-cpp-b4580-build + mkdir /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT + CFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 
-flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd llama.cpp-b4580 + DESTDIR=/builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT + /usr/bin/cmake --install redhat-linux-build -- Install configuration: "Release" -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml-cpu.so.b4580 -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml-cpu.so -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml-hip.so.b4580 -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml-hip.so -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml.so.b4580 -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml.so -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-cpu.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-alloc.h -- Installing: 
/builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-backend.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-blas.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-cann.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-cuda.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-kompute.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-opt.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-metal.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-rpc.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-sycl.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/ggml-vulkan.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/gguf.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml-base.so.b4580 -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml-base.so -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/cmake/ggml/ggml-config.cmake -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/cmake/ggml/ggml-version.cmake -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libllama.so.b4580 -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libllama.so -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/llama.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/include/llama-cpp.h -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/cmake/llama/llama-config.cmake -- Installing: 
/builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/cmake/llama/llama-version.cmake -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/bin/convert_hf_to_gguf.py -- Installing: /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib/pkgconfig/llama.pc + rm -rf '/builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/lib64/libggml_shared.*' + rm /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/bin/convert_hf_to_gguf.py + /usr/bin/find-debuginfo -j8 --strict-build-id -m -i --build-id-seed b4580-3.fc43 --unique-debug-suffix -b4580-3.fc43.x86_64 --unique-debug-src-base llama-cpp-b4580-3.fc43.x86_64 --run-dwz --dwz-low-mem-die-limit 10000000 --dwz-max-die-limit 110000000 -S debugsourcefiles.list /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580 find-debuginfo: starting Extracting debug info from 5 files DWARF-compressing 5 files dwz: ./usr/lib64/libggml-base.so.b4580-b4580-3.fc43.x86_64.debug: Unknown debugging section .debug_str_offsets dwz: ./usr/lib64/libggml-cpu.so.b4580-b4580-3.fc43.x86_64.debug: Unknown debugging section .debug_str_offsets dwz: ./usr/lib64/libggml-hip.so.b4580-b4580-3.fc43.x86_64.debug: Unknown debugging section .debug_str_offsets dwz: ./usr/lib64/libggml.so.b4580-b4580-3.fc43.x86_64.debug: Unknown debugging section .debug_str_offsets dwz: ./usr/lib64/libllama.so.b4580-b4580-3.fc43.x86_64.debug: Unknown debugging section .debug_str_offsets dwz: Too few files for multifile optimization sepdebugcrcfix: Updated 0 CRC32s, 5 CRC32s did match. 
Creating .debug symlinks for symlinks to ELF files Copying sources found by 'debugedit -l' to /usr/src/debug/llama-cpp-b4580-3.fc43.x86_64 find-debuginfo: done + /usr/lib/rpm/check-buildroot + /usr/lib/rpm/redhat/brp-ldconfig + /usr/lib/rpm/brp-compress + /usr/lib/rpm/redhat/brp-strip-lto /usr/bin/strip + /usr/lib/rpm/brp-strip-static-archive /usr/bin/strip + /usr/lib/rpm/check-rpaths + /usr/lib/rpm/redhat/brp-mangle-shebangs + /usr/lib/rpm/brp-remove-la-files + /usr/lib/rpm/redhat/brp-python-rpm-in-distinfo + env /usr/lib/rpm/redhat/brp-python-bytecompile '' 1 0 -j8 + /usr/lib/rpm/redhat/brp-python-hardlink + /usr/bin/add-determinism --brp -j8 /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT Scanned 32 directories and 208 files, processed 0 inodes, 0 modified (0 replaced + 0 rewritten), 0 unsupported format, 0 errors Reading /builddir/build/BUILD/llama-cpp-b4580-build/SPECPARTS/rpm-debuginfo.specpart Processing files: llama-cpp-b4580-3.fc43.x86_64 Executing(%license): /bin/sh -e /var/tmp/rpm-tmp.1YE5Cs + umask 022 + cd /builddir/build/BUILD/llama-cpp-b4580-build + cd llama.cpp-b4580 + LICENSEDIR=/builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/share/licenses/llama-cpp + export LC_ALL=C.UTF-8 + LC_ALL=C.UTF-8 + export LICENSEDIR + /usr/bin/mkdir -p /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/share/licenses/llama-cpp + cp -pr /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/LICENSE /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/share/licenses/llama-cpp + RPM_EC=0 ++ jobs -p + exit 0 Provides: libggml-base.so.b4580()(64bit) libggml-cpu.so.b4580()(64bit) libggml-hip.so.b4580()(64bit) libggml.so.b4580()(64bit) libllama.so.b4580()(64bit) llama-cpp = b4580-3.fc43 llama-cpp(x86-64) = b4580-3.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires: ld-linux-x86-64.so.2()(64bit) ld-linux-x86-64.so.2(GLIBC_2.3)(64bit) 
libamdhip64.so.6()(64bit) libamdhip64.so.6(hip_4.2)(64bit) libamdhip64.so.6(hip_6.0)(64bit) libc.so.6()(64bit) libc.so.6(GLIBC_2.14)(64bit) libc.so.6(GLIBC_2.17)(64bit) libc.so.6(GLIBC_2.2.5)(64bit) libc.so.6(GLIBC_2.29)(64bit) libc.so.6(GLIBC_2.3.2)(64bit) libc.so.6(GLIBC_2.3.4)(64bit) libc.so.6(GLIBC_2.32)(64bit) libc.so.6(GLIBC_2.33)(64bit) libc.so.6(GLIBC_2.34)(64bit) libc.so.6(GLIBC_2.38)(64bit) libc.so.6(GLIBC_2.4)(64bit) libc.so.6(GLIBC_2.7)(64bit) libc.so.6(GLIBC_ABI_DT_RELR)(64bit) libgcc_s.so.1()(64bit) libgcc_s.so.1(GCC_3.0)(64bit) libggml-base.so.b4580()(64bit) libggml-cpu.so.b4580()(64bit) libggml-hip.so.b4580()(64bit) libggml.so.b4580()(64bit) libhipblas.so.2()(64bit) libm.so.6()(64bit) libm.so.6(GLIBC_2.2.5)(64bit) libm.so.6(GLIBC_2.27)(64bit) libm.so.6(GLIBC_2.29)(64bit) librocblas.so.4()(64bit) libstdc++.so.6()(64bit) libstdc++.so.6(CXXABI_1.3)(64bit) libstdc++.so.6(CXXABI_1.3.11)(64bit) libstdc++.so.6(CXXABI_1.3.13)(64bit) libstdc++.so.6(CXXABI_1.3.2)(64bit) libstdc++.so.6(CXXABI_1.3.3)(64bit) libstdc++.so.6(CXXABI_1.3.5)(64bit) libstdc++.so.6(CXXABI_1.3.9)(64bit) libstdc++.so.6(GLIBCXX_3.4)(64bit) libstdc++.so.6(GLIBCXX_3.4.11)(64bit) libstdc++.so.6(GLIBCXX_3.4.14)(64bit) libstdc++.so.6(GLIBCXX_3.4.15)(64bit) libstdc++.so.6(GLIBCXX_3.4.17)(64bit) libstdc++.so.6(GLIBCXX_3.4.18)(64bit) libstdc++.so.6(GLIBCXX_3.4.19)(64bit) libstdc++.so.6(GLIBCXX_3.4.20)(64bit) libstdc++.so.6(GLIBCXX_3.4.21)(64bit) libstdc++.so.6(GLIBCXX_3.4.22)(64bit) libstdc++.so.6(GLIBCXX_3.4.25)(64bit) libstdc++.so.6(GLIBCXX_3.4.26)(64bit) libstdc++.so.6(GLIBCXX_3.4.29)(64bit) libstdc++.so.6(GLIBCXX_3.4.30)(64bit) libstdc++.so.6(GLIBCXX_3.4.9)(64bit) Recommends: numactl Processing files: llama-cpp-devel-b4580-3.fc43.x86_64 Executing(%doc): /bin/sh -e /var/tmp/rpm-tmp.4kubEq + umask 022 + cd /builddir/build/BUILD/llama-cpp-b4580-build + cd llama.cpp-b4580 + DOCDIR=/builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/share/doc/llama-cpp-devel + export LC_ALL=C.UTF-8 + 
LC_ALL=C.UTF-8 + export DOCDIR + /usr/bin/mkdir -p /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/share/doc/llama-cpp-devel + cp -pr /builddir/build/BUILD/llama-cpp-b4580-build/llama.cpp-b4580/README.md /builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT/usr/share/doc/llama-cpp-devel + RPM_EC=0 ++ jobs -p + exit 0 Provides: cmake(ggml) cmake(llama) llama-cpp-devel = b4580-3.fc43 llama-cpp-devel(x86-64) = b4580-3.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires: cmake-filesystem(x86-64) libggml-base.so.b4580()(64bit) libggml-cpu.so.b4580()(64bit) libggml-hip.so.b4580()(64bit) libggml.so.b4580()(64bit) libllama.so.b4580()(64bit) Processing files: llama-cpp-debugsource-b4580-3.fc43.x86_64 Provides: llama-cpp-debugsource = b4580-3.fc43 llama-cpp-debugsource(x86-64) = b4580-3.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Processing files: llama-cpp-debuginfo-b4580-3.fc43.x86_64 Provides: debuginfo(build-id) = 01f3de58952e35298c2e35884a52b43de76c4b4a debuginfo(build-id) = 373bfd4f35803c1a8ec32741c720f024ed638743 debuginfo(build-id) = 4182fed7db581a4cd6dd079322ed0d126bd74c0a debuginfo(build-id) = 48101ef7f70429b71c1a028e7303166f394f6e89 debuginfo(build-id) = 7363847e129cf2f5803014ff6d2a57383074574f libggml-base.so.b4580-b4580-3.fc43.x86_64.debug()(64bit) libggml-cpu.so.b4580-b4580-3.fc43.x86_64.debug()(64bit) libggml-hip.so.b4580-b4580-3.fc43.x86_64.debug()(64bit) libggml.so.b4580-b4580-3.fc43.x86_64.debug()(64bit) libllama.so.b4580-b4580-3.fc43.x86_64.debug()(64bit) llama-cpp-debuginfo = b4580-3.fc43 llama-cpp-debuginfo(x86-64) = b4580-3.fc43 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Recommends: llama-cpp-debugsource(x86-64) = b4580-3.fc43 Checking for unpackaged file(s): /usr/lib/rpm/check-files 
/builddir/build/BUILD/llama-cpp-b4580-build/BUILDROOT Wrote: /builddir/build/RPMS/llama-cpp-devel-b4580-3.fc43.x86_64.rpm Wrote: /builddir/build/RPMS/llama-cpp-debugsource-b4580-3.fc43.x86_64.rpm Wrote: /builddir/build/RPMS/llama-cpp-debuginfo-b4580-3.fc43.x86_64.rpm Wrote: /builddir/build/RPMS/llama-cpp-b4580-3.fc43.x86_64.rpm Child return code was: 0